loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 ***************************************** Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed. ***************************************** loaded library: loaded library: loaded library: loaded library: loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1/usr/lib/x86_64-linux-gnu/libibverbs.so.1/usr/lib/x86_64-linux-gnu/libibverbs.so.1/usr/lib/x86_64-linux-gnu/libibverbs.so.1 /usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1/usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 W20220411 00:54:14.590472 2300 rpc_client.cpp:190] LoadServer 10.7.222.219 Failed at 0 times error_code 14 error_message failed to connect to all addresses W20220411 00:54:14.593068 2302 rpc_client.cpp:190] LoadServer 10.7.222.219 Failed at 0 times error_code 14 error_message failed to connect to all addresses ------------------------ arguments ------------------------ batches_per_epoch ............................... 834 channel_last .................................... False ddp ............................................. True exit_num ........................................ -1 fuse_bn_add_relu ................................ False fuse_bn_relu .................................... False gpu_stat_file ................................... None grad_clipping ................................... 0.0 graph ........................................... False label_smoothing ................................. 0.1 learning_rate ................................... 1.536 legacy_init ..................................... False load_path ....................................... None lr_decay_type ................................... cosine metric_local .................................... True metric_train_acc ................................ True momentum ........................................ 0.875 nccl_fusion_max_ops ............................. 24 nccl_fusion_threshold_mb ........................ 16 num_classes ..................................... 1000 num_devices_per_node ............................ 8 num_epochs ...................................... 50 num_nodes ....................................... 1 ofrecord_part_num ............................... 256 ofrecord_path ................................... /dataset/79846248 print_interval .................................. 100 print_timestamp ................................. False samples_per_epoch ............................... 1281167 save_init ....................................... False save_path ....................................... None scale_grad ...................................... False skip_eval ....................................... False synthetic_data .................................. False total_batches ................................... -1 train_batch_size ................................ 192 train_global_batch_size ......................... 1536 use_fp16 ........................................ False use_gpu_decode .................................. False val_batch_size .................................. 50 val_batches_per_epoch ........................... 125 val_global_batch_size ........................... 400 val_samples_per_epoch ........................... 50000 warmup_epochs ................................... 5 weight_decay .................................... 3.0517578125e-05 zero_init_residual .............................. True -------------------- end of arguments --------------------- ***** Model Init ***** ***** Model Init Finish, time escapled: 2.71685 s ***** [rank:4] [train], epoch: 0/50, iter: 100/834, loss: 0.85863, lr: 0.035933, top1: 0.00417, throughput: 284.46 | 2022-04-11 00:55:37.172 [rank:2] [train], epoch: 0/50, iter: 100/834, loss: 0.85853, lr: 0.035933, top1: 0.00380, throughput: 284.14 | 2022-04-11 00:55:37.175 [rank:7] [train], epoch: 0/50, iter: 100/834, loss: 0.85857, lr: 0.035933, top1: 0.00500, throughput: 284.26 | 2022-04-11 00:55:37.174 [rank:0] [train], epoch: 0/50, iter: 100/834, loss: 0.85896, lr: 0.035933, top1: 0.00344, throughput: 284.08 | 2022-04-11 00:55:37.192 [rank:3] [train], epoch: 0/50, iter: 100/834, loss: 0.85904, lr: 0.035933, top1: 0.00432, throughput: 284.30 | 2022-04-11 00:55:37.198 [rank:1] [train], epoch: 0/50, iter: 100/834, loss: 0.85865, lr: 0.035933, top1: 0.00422, throughput: 284.28 | 2022-04-11 00:55:37.201 [rank:6] [train], epoch: 0/50, iter: 100/834, loss: 0.85885, lr: 0.035933, top1: 0.00391, throughput: 284.22 | 2022-04-11 00:55:37.238 [rank:5] [train], epoch: 0/50, iter: 100/834, loss: 0.85890, lr: 0.035933, top1: 0.00443, throughput: 284.20 | 2022-04-11 00:55:37.251 timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/11 00:55:37.529, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 62 %, 32510 MiB, 11750 MiB, 20760 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/11 00:55:37.555, Tesla V100-SXM2-32GB, 470.57.02, 97 %, 73 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/11 00:55:37.563, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 62 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/11 00:55:37.568, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 62 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/11 00:55:37.579, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/11 00:55:37.600, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 52 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/11 00:55:37.601, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 52 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/11 00:55:37.617, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 56 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/11 00:55:37.635, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/11 00:55:37.636, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/11 00:55:37.655, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/11 00:55:37.671, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 56 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/11 00:55:37.672, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 56 %, 32510 MiB, 11822 MiB, 20688 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/11 00:55:37.679, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 57 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/11 00:55:37.695, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/11 00:55:37.696, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/11 00:55:37.711, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 64 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/11 00:55:37.710, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 58 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/11 00:55:37.711, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 58 %, 32510 MiB, 11750 MiB, 20760 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/11 00:55:37.716, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 57 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/11 00:55:37.720, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 57 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/11 00:55:37.732, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 54 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/11 00:55:37.734, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 64 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/11 00:55:37.734, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 64 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/11 00:55:37.736, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 58 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/11 00:55:37.740, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/11 00:55:37.750, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/11 00:55:37.766, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 61 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/11 00:55:37.766, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 61 %, 32510 MiB, 11846 MiB, 20664 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/11 00:55:37.771, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 64 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/11 00:55:37.775, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 69 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/11 00:55:37.776, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 69 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/11 00:55:37.785, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/11 00:55:37.786, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/11 00:55:37.787, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/11 00:55:37.788, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 61 %, 32510 MiB, 11846 MiB, 20664 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/04/11 00:55:37.808, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/11 00:55:37.808, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/11 00:55:37.817, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 64 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/11 00:55:37.820, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/11 00:55:37.827, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11750 MiB, 20760 MiB 2022/04/11 00:55:37.831, Tesla V100-SXM2-32GB, 470.57.02, 92 %, 64 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/11 00:55:37.831, Tesla V100-SXM2-32GB, 470.57.02, 92 %, 64 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/11 00:55:37.833, Tesla V100-SXM2-32GB, 470.57.02, 81 %, 31 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/11 00:55:37.845, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/11 00:55:37.849, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 64 %, 32510 MiB, 11770 MiB, 20740 MiB 2022/04/11 00:55:37.856, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/11 00:55:37.856, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/11 00:55:37.858, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 59 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/11 00:55:37.860, Tesla V100-SXM2-32GB, 470.57.02, 92 %, 64 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/11 00:55:37.864, Tesla V100-SXM2-32GB, 470.57.02, 81 %, 31 %, 32510 MiB, 11846 MiB, 20664 MiB 2022/04/11 00:55:37.866, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 69 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/11 00:55:37.866, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 69 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/11 00:55:37.868, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/11 00:55:37.876, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/11 00:55:37.882, Tesla V100-SXM2-32GB, 470.57.02, 70 %, 37 %, 32510 MiB, 11822 MiB, 20688 MiB 2022/04/11 00:55:37.891, Tesla V100-SXM2-32GB, 470.57.02, 92 %, 64 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/11 00:55:37.893, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 69 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/11 00:55:37.897, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 56 %, 32510 MiB, 11830 MiB, 20680 MiB 2022/04/11 00:55:37.899, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/11 00:55:37.902, Tesla V100-SXM2-32GB, 470.57.02, 92 %, 64 %, 32510 MiB, 11762 MiB, 20748 MiB 2022/04/11 00:55:37.903, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 69 %, 32510 MiB, 11786 MiB, 20724 MiB 2022/04/11 00:55:37.905, Tesla V100-SXM2-32GB, 470.57.02, 99 %, 68 %, 32510 MiB, 11706 MiB, 20804 MiB 2022/04/11 00:55:37.908, Tesla V100-SXM2-32GB, 470.57.02, 100 %, 69 %, 32510 MiB, 11786 MiB, 20724 MiB [rank:2] [train], epoch: 0/50, iter: 200/834, loss: 0.82525, lr: 0.071866, top1: 0.01354, throughput: 308.73 | 2022-04-11 00:56:39.364 [rank:6] [train], epoch: 0/50, iter: 200/834, loss: 0.82594, lr: 0.071866, top1: 0.01339, throughput: 308.99 | 2022-04-11 00:56:39.375 [rank:5] [train], epoch: 0/50, iter: 200/834, loss: 0.82510, lr: 0.071866, top1: 0.01401, throughput: 309.02 | 2022-04-11 00:56:39.383 [rank:1] [train], epoch: 0/50, iter: 200/834, loss: 0.82505, lr: 0.071866, top1: 0.01323, throughput: 308.76 | 2022-04-11 00:56:39.384 [rank:3] [train], epoch: 0/50, iter: 200/834, loss: 0.82599, lr: 0.071866, top1: 0.01401, throughput: 308.97 | 2022-04-11 00:56:39.340 [rank:4] [train], epoch: 0/50, iter: 200/834, loss: 0.82606, lr: 0.071866, top1: 0.01286, throughput: 308.35 | 2022-04-11 00:56:39.439 [rank:7] [train], epoch: 0/50, iter: 200/834, loss: 0.82711, lr: 0.071866, top1: 0.01370, throughput: 308.35 | 2022-04-11 00:56:39.442 [rank:0] [train], epoch: 0/50, iter: 200/834, loss: 0.82672, lr: 0.071866, top1: 0.01411, throughput: 308.39 | 2022-04-11 00:56:39.451 [rank:2] [train], epoch: 0/50, iter: 300/834, loss: 0.80312, lr: 0.107799, top1: 0.01859, throughput: 311.79 | 2022-04-11 00:57:40.944 [rank:6] [train], epoch: 0/50, iter: 300/834, loss: 0.80273, lr: 0.107799, top1: 0.01990, throughput: 311.55 | 2022-04-11 00:57:41.003 [rank:7] [train], epoch: 0/50, iter: 300/834, loss: 0.80211, lr: 0.107799, top1: 0.01844, throughput: 311.72 | 2022-04-11 00:57:41.036 [rank:0] [train], epoch: 0/50, iter: 300/834, loss: 0.80262, lr: 0.107799, top1: 0.01833, throughput: 311.74 | 2022-04-11 00:57:41.040 [rank:1] [train], epoch: 0/50, iter: 300/834, loss: 0.80235, lr: 0.107799, top1: 0.02036, throughput: 311.36 | 2022-04-11 00:57:41.049 [rank:3] [train], epoch: 0/50, iter: 300/834, loss: 0.80177, lr: 0.107799, top1: 0.02047, throughput: 311.07 | 2022-04-11 00:57:41.063 [rank:4] [train], epoch: 0/50, iter: 300/834, loss: 0.80257, lr: 0.107799, top1: 0.01943, throughput: 311.47 | 2022-04-11 00:57:41.083 [rank:5] [train], epoch: 0/50, iter: 300/834, loss: 0.80118, lr: 0.107799, top1: 0.02125, throughput: 311.07 | 2022-04-11 00:57:41.105 [rank:5] [train], epoch: 0/50, iter: 400/834, loss: 0.78632, lr: 0.143733, top1: 0.02531, throughput: 312.90 | 2022-04-11 00:58:42.467 [rank:6] [train], epoch: 0/50, iter: 400/834, loss: 0.78556, lr: 0.143733, top1: 0.02583, throughput: 312.36 | 2022-04-11 00:58:42.470 [rank:4] [train], epoch: 0/50, iter: 400/834, loss: 0.78554, lr: 0.143733, top1: 0.02479, throughput: 312.71 | 2022-04-11 00:58:42.481 [rank:2] [train], epoch: 0/50, iter: 400/834, loss: 0.78505, lr: 0.143733, top1: 0.02635, throughput: 312.00 | 2022-04-11 00:58:42.481 [rank:3] [train], epoch: 0/50, iter: 400/834, loss: 0.78569, lr: 0.143733, top1: 0.02563, throughput: 312.58 | 2022-04-11 00:58:42.488 [rank:1] [train], epoch: 0/50, iter: 400/834, loss: 0.78546, lr: 0.143733, top1: 0.02578, throughput: 312.43 | 2022-04-11 00:58:42.503 [rank:7] [train], epoch: 0/50, iter: 400/834, loss: 0.78673, lr: 0.143733, top1: 0.02474, throughput: 312.24 | 2022-04-11 00:58:42.527 [rank:0] [train], epoch: 0/50, iter: 400/834, loss: 0.78607, lr: 0.143733, top1: 0.02641, throughput: 312.22 | 2022-04-11 00:58:42.535 [rank:6] [train], epoch: 0/50, iter: 500/834, loss: 0.77029, lr: 0.179666, top1: 0.03188, throughput: 311.36 | 2022-04-11 00:59:44.135 [rank:1] [train], epoch: 0/50, iter: 500/834, loss: 0.76978, lr: 0.179666, top1: 0.03479, throughput: 311.42 | 2022-04-11 00:59:44.156 [rank:2] [train], epoch: 0/50, iter: 500/834, loss: 0.77189, lr: 0.179666, top1: 0.03255, throughput: 311.30 | 2022-04-11 00:59:44.159 [rank:4] [train], epoch: 0/50, iter: 500/834, loss: 0.77026, lr: 0.179666, top1: 0.03385, throughput: 311.24 | 2022-04-11 00:59:44.170 [rank:5] [train], epoch: 0/50, iter: 500/834, loss: 0.76969, lr: 0.179666, top1: 0.03141, throughput: 311.13 | 2022-04-11 00:59:44.177 [rank:0] [train], epoch: 0/50, iter: 500/834, loss: 0.76869, lr: 0.179666, top1: 0.03417, throughput: 311.44 | 2022-04-11 00:59:44.184 [rank:7] [train], epoch: 0/50, iter: 500/834, loss: 0.77196, lr: 0.179666, top1: 0.03250, throughput: 311.35 | 2022-04-11 00:59:44.194 [rank:3] [train], epoch: 0/50, iter: 500/834, loss: 0.76727, lr: 0.179666, top1: 0.03557, throughput: 311.06 | 2022-04-11 00:59:44.212 [rank:5] [train], epoch: 0/50, iter: 600/834, loss: 0.75201, lr: 0.215599, top1: 0.04547, throughput: 312.50 | 2022-04-11 01:00:45.616 [rank:6] [train], epoch: 0/50, iter: 600/834, loss: 0.75273, lr: 0.215599, top1: 0.04240, throughput: 312.28 | 2022-04-11 01:00:45.618 [rank:3] [train], epoch: 0/50, iter: 600/834, loss: 0.75403, lr: 0.215599, top1: 0.04474, throughput: 312.62 | 2022-04-11 01:00:45.628 [rank:1] [train], epoch: 0/50, iter: 600/834, loss: 0.75484, lr: 0.215599, top1: 0.04312, throughput: 312.31 | 2022-04-11 01:00:45.634 [rank:0] [train], epoch: 0/50, iter: 600/834, loss: 0.75332, lr: 0.215599, top1: 0.04203, throughput: 312.44 | 2022-04-11 01:00:45.636 [rank:4] [train], epoch: 0/50, iter: 600/834, loss: 0.75333, lr: 0.215599, top1: 0.04214, throughput: 312.32 | 2022-04-11 01:00:45.645 [rank:2] [train], epoch: 0/50, iter: 600/834, loss: 0.75344, lr: 0.215599, top1: 0.04292, throughput: 312.14 | 2022-04-11 01:00:45.670 [rank:7] [train], epoch: 0/50, iter: 600/834, loss: 0.75399, lr: 0.215599, top1: 0.04240, throughput: 312.21 | 2022-04-11 01:00:45.690 [rank:2] [train], epoch: 0/50, iter: 700/834, loss: 0.73717, lr: 0.251532, top1: 0.05083, throughput: 312.81 | 2022-04-11 01:01:47.048 [rank:1] [train], epoch: 0/50, iter: 700/834, loss: 0.73644, lr: 0.251532, top1: 0.05271, throughput: 312.56 | 2022-04-11 01:01:47.061 [rank:6] [train], epoch: 0/50, iter: 700/834, loss: 0.73937, lr: 0.251532, top1: 0.05063, throughput: 312.44 | 2022-04-11 01:01:47.071 [rank:7] [train], epoch: 0/50, iter: 700/834, loss: 0.73940, lr: 0.251532, top1: 0.04880, throughput: 312.74 | 2022-04-11 01:01:47.084 [rank:5] [train], epoch: 0/50, iter: 700/834, loss: 0.73890, lr: 0.251532, top1: 0.05380, throughput: 312.31 | 2022-04-11 01:01:47.094 [rank:3] [train], epoch: 0/50, iter: 700/834, loss: 0.73881, lr: 0.251532, top1: 0.05062, throughput: 312.31 | 2022-04-11 01:01:47.106 [rank:0] [train], epoch: 0/50, iter: 700/834, loss: 0.73884, lr: 0.251532, top1: 0.05198, throughput: 312.21 | 2022-04-11 01:01:47.133 [rank:4] [train], epoch: 0/50, iter: 700/834, loss: 0.73793, lr: 0.251532, top1: 0.05156, throughput: 312.22 | 2022-04-11 01:01:47.141 [rank:1] [train], epoch: 0/50, iter: 800/834, loss: 0.72528, lr: 0.287465, top1: 0.05885, throughput: 312.72 | 2022-04-11 01:02:48.457 [rank:2] [train], epoch: 0/50, iter: 800/834, loss: 0.72592, lr: 0.287465, top1: 0.05839, throughput: 312.62 | 2022-04-11 01:02:48.465 [rank:5] [train], epoch: 0/50, iter: 800/834, loss: 0.72514, lr: 0.287465, top1: 0.06026, throughput: 312.82 | 2022-04-11 01:02:48.472 [rank:0] [train], epoch: 0/50, iter: 800/834, loss: 0.72532, lr: 0.287465, top1: 0.05776, throughput: 312.98 | 2022-04-11 01:02:48.478 [rank:3] [train], epoch: 0/50, iter: 800/834, loss: 0.72501, lr: 0.287465, top1: 0.05896, throughput: 312.74 | 2022-04-11 01:02:48.499 [rank:6] [train], epoch: 0/50, iter: 800/834, loss: 0.72221, lr: 0.287465, top1: 0.06047, throughput: 312.50 | 2022-04-11 01:02:48.510 [rank:4] [train], epoch: 0/50, iter: 800/834, loss: 0.72454, lr: 0.287465, top1: 0.05818, throughput: 312.82 | 2022-04-11 01:02:48.517 [rank:7] [train], epoch: 0/50, iter: 800/834, loss: 0.72445, lr: 0.287465, top1: 0.06198, throughput: 312.28 | 2022-04-11 01:02:48.567 [rank:6] [train], epoch: 0/50, iter: 834/834, loss: 0.71171, lr: 0.299682, top1: 0.06893, throughput: 313.83 | 2022-04-11 01:03:09.311 [rank:4] [train], epoch: 0/50, iter: 834/834, loss: 0.71287, lr: 0.299682, top1: 0.06863, throughput: 313.89 | 2022-04-11 01:03:09.314 [rank:5] [train], epoch: 0/50, iter: 834/834, loss: 0.71464, lr: 0.299682, top1: 0.06786, throughput: 313.18 | 2022-04-11 01:03:09.316 [rank:2] [train], epoch: 0/50, iter: 834/834, loss: 0.71223, lr: 0.299682, top1: 0.07123, throughput: 313.00 | 2022-04-11 01:03:09.321 [rank:3] [train], epoch: 0/50, iter: 834/834, loss: 0.71523, lr: 0.299682, top1: 0.06771, throughput: 313.50 | 2022-04-11 01:03:09.322 [rank:7] [train], epoch: 0/50, iter: 834/834, loss: 0.71499, lr: 0.299682, top1: 0.06327, throughput: 314.52 | 2022-04-11 01:03:09.323 [rank:1] [train], epoch: 0/50, iter: 834/834, loss: 0.71320, lr: 0.299682, top1: 0.06419, throughput: 312.73 | 2022-04-11 01:03:09.331 [rank:0] [train], epoch: 0/50, iter: 834/834, loss: 0.71214, lr: 0.299682, top1: 0.06495, throughput: 312.48 | 2022-04-11 01:03:09.369 [rank:1] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.05920, throughput: 470.42 | 2022-04-11 01:03:22.617 [rank:0] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.05520, throughput: 471.68 | 2022-04-11 01:03:22.620 [rank:4] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.05728, throughput: 469.56 | 2022-04-11 01:03:22.625 [rank:5] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.05520, throughput: 468.99 | 2022-04-11 01:03:22.642 [rank:6] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.05440, throughput: 468.79 | 2022-04-11 01:03:22.643 [rank:2] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.05856, throughput: 469.13 | 2022-04-11 01:03:22.643 [rank:7] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.05552, throughput: 469.18 | 2022-04-11 01:03:22.644 [rank:3] [eval], epoch: 0/50, iter: 125/125, loss: 0.00000, lr: 0.299682, top1: 0.05264, throughput: 465.50 | 2022-04-11 01:03:22.748 [rank:6] [train], epoch: 1/50, iter: 100/834, loss: 0.70346, lr: 0.335615, top1: 0.07479, throughput: 313.57 | 2022-04-11 01:04:23.873 [rank:5] [train], epoch: 1/50, iter: 100/834, loss: 0.70350, lr: 0.335615, top1: 0.07641, throughput: 313.43 | 2022-04-11 01:04:23.901 [rank:4] [train], epoch: 1/50, iter: 100/834, loss: 0.70351, lr: 0.335615, top1: 0.07370, throughput: 313.28 | 2022-04-11 01:04:23.912 [rank:2] [train], epoch: 1/50, iter: 100/834, loss: 0.70179, lr: 0.335615, top1: 0.07505, throughput: 313.29 | 2022-04-11 01:04:23.928 [rank:7] [train], epoch: 1/50, iter: 100/834, loss: 0.70350, lr: 0.335615, top1: 0.07927, throughput: 313.27 | 2022-04-11 01:04:23.933 [rank:1] [train], epoch: 1/50, iter: 100/834, loss: 0.70475, lr: 0.335615, top1: 0.07245, throughput: 313.09 | 2022-04-11 01:04:23.942 [rank:0] [train], epoch: 1/50, iter: 100/834, loss: 0.70103, lr: 0.335615, top1: 0.07427, throughput: 313.10 | 2022-04-11 01:04:23.943 [rank:3] [train], epoch: 1/50, iter: 100/834, loss: 0.70283, lr: 0.335615, top1: 0.07531, throughput: 313.75 | 2022-04-11 01:04:23.944 [rank:2] [train], epoch: 1/50, iter: 200/834, loss: 0.68400, lr: 0.371549, top1: 0.09021, throughput: 312.40 | 2022-04-11 01:05:25.388 [rank:4] [train], epoch: 1/50, iter: 200/834, loss: 0.68490, lr: 0.371549, top1: 0.08807, throughput: 312.32 | 2022-04-11 01:05:25.388 [rank:0] [train], epoch: 1/50, iter: 200/834, loss: 0.68602, lr: 0.371549, top1: 0.08901, throughput: 312.44 | 2022-04-11 01:05:25.396 [rank:1] [train], epoch: 1/50, iter: 200/834, loss: 0.68656, lr: 0.371549, top1: 0.09031, throughput: 312.39 | 2022-04-11 01:05:25.402 [rank:3] [train], epoch: 1/50, iter: 200/834, loss: 0.68836, lr: 0.371549, top1: 0.09182, throughput: 312.25 | 2022-04-11 01:05:25.433 [rank:6] [train], epoch: 1/50, iter: 200/834, loss: 0.68803, lr: 0.371549, top1: 0.08865, throughput: 311.81 | 2022-04-11 01:05:25.448 [rank:7] [train], epoch: 1/50, iter: 200/834, loss: 0.68705, lr: 0.371549, top1: 0.09005, throughput: 312.07 | 2022-04-11 01:05:25.457 [rank:5] [train], epoch: 1/50, iter: 200/834, loss: 0.68649, lr: 0.371549, top1: 0.09182, throughput: 311.79 | 2022-04-11 01:05:25.481 [rank:1] [train], epoch: 1/50, iter: 300/834, loss: 0.67133, lr: 0.407482, top1: 0.09974, throughput: 312.56 | 2022-04-11 01:06:26.831 [rank:4] [train], epoch: 1/50, iter: 300/834, loss: 0.67108, lr: 0.407482, top1: 0.10349, throughput: 312.47 | 2022-04-11 01:06:26.834 [rank:3] [train], epoch: 1/50, iter: 300/834, loss: 0.67127, lr: 0.407482, top1: 0.10854, throughput: 312.65 | 2022-04-11 01:06:26.844 [rank:7] [train], epoch: 1/50, iter: 300/834, loss: 0.67062, lr: 0.407482, top1: 0.10505, throughput: 312.61 | 2022-04-11 01:06:26.876 [rank:0] [train], epoch: 1/50, iter: 300/834, loss: 0.67192, lr: 0.407482, top1: 0.10406, throughput: 312.27 | 2022-04-11 01:06:26.881 [rank:6] [train], epoch: 1/50, iter: 300/834, loss: 0.67183, lr: 0.407482, top1: 0.10187, throughput: 312.53 | 2022-04-11 01:06:26.883 [rank:5] [train], epoch: 1/50, iter: 300/834, loss: 0.67132, lr: 0.407482, top1: 0.10333, throughput: 312.66 | 2022-04-11 01:06:26.889 [rank:2] [train], epoch: 1/50, iter: 300/834, loss: 0.67080, lr: 0.407482, top1: 0.10625, throughput: 312.14 | 2022-04-11 01:06:26.900 [rank:7] [train], epoch: 1/50, iter: 400/834, loss: 0.65625, lr: 0.443415, top1: 0.11547, throughput: 311.67 | 2022-04-11 01:07:28.479 [rank:4] [train], epoch: 1/50, iter: 400/834, loss: 0.65713, lr: 0.443415, top1: 0.11859, throughput: 311.02 | 2022-04-11 01:07:28.566 [rank:1] [train], epoch: 1/50, iter: 400/834, loss: 0.65463, lr: 0.443415, top1: 0.11708, throughput: 311.00 | 2022-04-11 01:07:28.567 [rank:0] [train], epoch: 1/50, iter: 400/834, loss: 0.65470, lr: 0.443415, top1: 0.11922, throughput: 311.22 | 2022-04-11 01:07:28.573 [rank:6] [train], epoch: 1/50, iter: 400/834, loss: 0.65608, lr: 0.443415, top1: 0.12052, throughput: 311.16 | 2022-04-11 01:07:28.588 [rank:2] [train], epoch: 1/50, iter: 400/834, loss: 0.65569, lr: 0.443415, top1: 0.11547, throughput: 311.20 | 2022-04-11 01:07:28.595 [rank:3] [train], epoch: 1/50, iter: 400/834, loss: 0.65705, lr: 0.443415, top1: 0.11745, throughput: 310.89 | 2022-04-11 01:07:28.603 [rank:5] [train], epoch: 1/50, iter: 400/834, loss: 0.65450, lr: 0.443415, top1: 0.11990, throughput: 310.98 | 2022-04-11 01:07:28.629 [rank:6] [train], epoch: 1/50, iter: 500/834, loss: 0.64133, lr: 0.479348, top1: 0.13146, throughput: 311.51 | 2022-04-11 01:08:30.224 [rank:0] [train], epoch: 1/50, iter: 500/834, loss: 0.64256, lr: 0.479348, top1: 0.13255, throughput: 311.42 | 2022-04-11 01:08:30.225 [rank:2] [train], epoch: 1/50, iter: 500/834, loss: 0.64244, lr: 0.479348, top1: 0.13172, throughput: 311.49 | 2022-04-11 01:08:30.234 [rank:1] [train], epoch: 1/50, iter: 500/834, loss: 0.64060, lr: 0.479348, top1: 0.13276, throughput: 311.19 | 2022-04-11 01:08:30.265 [rank:7] [train], epoch: 1/50, iter: 500/834, loss: 0.64302, lr: 0.479348, top1: 0.12922, throughput: 310.70 | 2022-04-11 01:08:30.274 [rank:5] [train], epoch: 1/50, iter: 500/834, loss: 0.63864, lr: 0.479348, top1: 0.13667, throughput: 311.46 | 2022-04-11 01:08:30.274 [rank:4] [train], epoch: 1/50, iter: 500/834, loss: 0.64028, lr: 0.479348, top1: 0.13516, throughput: 311.07 | 2022-04-11 01:08:30.288 [rank:3] [train], epoch: 1/50, iter: 500/834, loss: 0.63996, lr: 0.479348, top1: 0.13167, throughput: 311.25 | 2022-04-11 01:08:30.289 [rank:5] [train], epoch: 1/50, iter: 600/834, loss: 0.62444, lr: 0.515281, top1: 0.15042, throughput: 313.52 | 2022-04-11 01:09:31.514 [rank:4] [train], epoch: 1/50, iter: 600/834, loss: 0.62524, lr: 0.515281, top1: 0.14812, throughput: 313.37 | 2022-04-11 01:09:31.558 [rank:7] [train], epoch: 1/50, iter: 600/834, loss: 0.62504, lr: 0.515281, top1: 0.15109, throughput: 313.24 | 2022-04-11 01:09:31.570 [rank:2] [train], epoch: 1/50, iter: 600/834, loss: 0.62605, lr: 0.515281, top1: 0.14677, throughput: 312.87 | 2022-04-11 01:09:31.602 [rank:3] [train], epoch: 1/50, iter: 600/834, loss: 0.62416, lr: 0.515281, top1: 0.15198, throughput: 313.07 | 2022-04-11 01:09:31.616 [rank:1] [train], epoch: 1/50, iter: 600/834, loss: 0.62533, lr: 0.515281, top1: 0.15307, throughput: 312.92 | 2022-04-11 01:09:31.623 [rank:6] [train], epoch: 1/50, iter: 600/834, loss: 0.62419, lr: 0.515281, top1: 0.14990, throughput: 312.59 | 2022-04-11 01:09:31.647 [rank:0] [train], epoch: 1/50, iter: 600/834, loss: 0.62538, lr: 0.515281, top1: 0.15177, throughput: 312.56 | 2022-04-11 01:09:31.654 [rank:2] [train], epoch: 1/50, iter: 700/834, loss: 0.61061, lr: 0.551214, top1: 0.16401, throughput: 312.40 | 2022-04-11 01:10:33.061 [rank:0] [train], epoch: 1/50, iter: 700/834, loss: 0.61097, lr: 0.551214, top1: 0.16526, throughput: 312.60 | 2022-04-11 01:10:33.075 [rank:7] [train], epoch: 1/50, iter: 700/834, loss: 0.61479, lr: 0.551214, top1: 0.16411, throughput: 312.13 | 2022-04-11 01:10:33.083 [rank:1] [train], epoch: 1/50, iter: 700/834, loss: 0.61144, lr: 0.551214, top1: 0.16234, throughput: 312.35 | 2022-04-11 01:10:33.093 [rank:4] [train], epoch: 1/50, iter: 700/834, loss: 0.61300, lr: 0.551214, top1: 0.16396, throughput: 312.01 | 2022-04-11 01:10:33.095 [rank:5] [train], epoch: 1/50, iter: 700/834, loss: 0.61338, lr: 0.551214, top1: 0.16047, throughput: 311.78 | 2022-04-11 01:10:33.096 [rank:6] [train], epoch: 1/50, iter: 700/834, loss: 0.61321, lr: 0.551214, top1: 0.16380, throughput: 312.24 | 2022-04-11 01:10:33.139 [rank:3] [train], epoch: 1/50, iter: 700/834, loss: 0.61138, lr: 0.551214, top1: 0.16203, throughput: 312.48 | 2022-04-11 01:10:33.060 [rank:1] [train], epoch: 1/50, iter: 800/834, loss: 0.59505, lr: 0.587147, top1: 0.18516, throughput: 312.11 | 2022-04-11 01:11:34.609 [rank:2] [train], epoch: 1/50, iter: 800/834, loss: 0.59800, lr: 0.587147, top1: 0.17854, throughput: 311.81 | 2022-04-11 01:11:34.637 [rank:5] [train], epoch: 1/50, iter: 800/834, loss: 0.59821, lr: 0.587147, top1: 0.17630, throughput: 311.86 | 2022-04-11 01:11:34.661 [rank:3] [train], epoch: 1/50, iter: 800/834, loss: 0.59484, lr: 0.587147, top1: 0.18250, throughput: 311.64 | 2022-04-11 01:11:34.668 [rank:4] [train], epoch: 1/50, iter: 800/834, loss: 0.59964, lr: 0.587147, top1: 0.17464, throughput: 311.80 | 2022-04-11 01:11:34.672 [rank:7] [train], epoch: 1/50, iter: 800/834, loss: 0.59705, lr: 0.587147, top1: 0.18047, throughput: 311.72 | 2022-04-11 01:11:34.677 [rank:6] [train], epoch: 1/50, iter: 800/834, loss: 0.59755, lr: 0.587147, top1: 0.18073, throughput: 311.80 | 2022-04-11 01:11:34.717 [rank:0] [train], epoch: 1/50, iter: 800/834, loss: 0.59609, lr: 0.587147, top1: 0.18000, throughput: 311.94 | 2022-04-11 01:11:34.625 [rank:4] [train], epoch: 1/50, iter: 834/834, loss: 0.59195, lr: 0.599365, top1: 0.18796, throughput: 312.81 | 2022-04-11 01:11:55.541 [rank:5] [train], epoch: 1/50, iter: 834/834, loss: 0.59389, lr: 0.599365, top1: 0.17892, throughput: 312.53 | 2022-04-11 01:11:55.549 [rank:6] [train], epoch: 1/50, iter: 834/834, loss: 0.58811, lr: 0.599365, top1: 0.19010, throughput: 313.36 | 2022-04-11 01:11:55.549 [rank:7] [train], epoch: 1/50, iter: 834/834, loss: 0.58823, lr: 0.599365, top1: 0.18873, throughput: 312.75 | 2022-04-11 01:11:55.549 [rank:2] [train], epoch: 1/50, iter: 834/834, loss: 0.58619, lr: 0.599365, top1: 0.19072, throughput: 312.11 | 2022-04-11 01:11:55.552 [rank:0] [train], epoch: 1/50, iter: 834/834, loss: 0.58478, lr: 0.599365, top1: 0.18919, throughput: 311.89 | 2022-04-11 01:11:55.556 [rank:1] [train], epoch: 1/50, iter: 834/834, loss: 0.58678, lr: 0.599365, top1: 0.19271, throughput: 311.61 | 2022-04-11 01:11:55.558 [rank:3] [train], epoch: 1/50, iter: 834/834, loss: 0.58555, lr: 0.599365, top1: 0.19531, throughput: 312.28 | 2022-04-11 01:11:55.573 [rank:0] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.14224, throughput: 481.46 | 2022-04-11 01:12:08.537 [rank:1] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.14544, throughput: 481.30 | 2022-04-11 01:12:08.544 [rank:4] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.14096, throughput: 480.48 | 2022-04-11 01:12:08.548 [rank:7] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.14784, throughput: 480.77 | 2022-04-11 01:12:08.549 [rank:2] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.15248, throughput: 480.80 | 2022-04-11 01:12:08.551 [rank:5] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.14000, throughput: 480.66 | 2022-04-11 01:12:08.552 [rank:6] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.14704, throughput: 480.59 | 2022-04-11 01:12:08.554 [rank:3] [eval], epoch: 1/50, iter: 125/125, loss: 0.00000, lr: 0.599365, top1: 0.13984, throughput: 479.89 | 2022-04-11 01:12:08.596 [rank:1] [train], epoch: 2/50, iter: 100/834, loss: 0.57961, lr: 0.635298, top1: 0.19958, throughput: 312.38 | 2022-04-11 01:13:10.007 [rank:2] [train], epoch: 2/50, iter: 100/834, loss: 0.58073, lr: 0.635298, top1: 0.20307, throughput: 312.19 | 2022-04-11 01:13:10.052 [rank:3] [train], epoch: 2/50, iter: 100/834, loss: 0.58153, lr: 0.635298, top1: 0.20229, throughput: 312.38 | 2022-04-11 01:13:10.060 [rank:6] [train], epoch: 2/50, iter: 100/834, loss: 0.57690, lr: 0.635298, top1: 0.20458, throughput: 312.13 | 2022-04-11 01:13:10.067 [rank:0] [train], epoch: 2/50, iter: 100/834, loss: 0.57911, lr: 0.635298, top1: 0.20646, throughput: 311.94 | 2022-04-11 01:13:10.088 [rank:4] [train], epoch: 2/50, iter: 100/834, loss: 0.57817, lr: 0.635298, top1: 0.20193, throughput: 311.94 | 2022-04-11 01:13:10.098 [rank:5] [train], epoch: 2/50, iter: 100/834, loss: 0.57898, lr: 0.635298, top1: 0.20203, throughput: 311.96 | 2022-04-11 01:13:10.099 [rank:7] [train], epoch: 2/50, iter: 100/834, loss: 0.57729, lr: 0.635298, top1: 0.20531, throughput: 311.83 | 2022-04-11 01:13:10.122 [rank:2] [train], epoch: 2/50, iter: 200/834, loss: 0.57044, lr: 0.671231, top1: 0.21766, throughput: 310.71 | 2022-04-11 01:14:11.846 [rank:4] [train], epoch: 2/50, iter: 200/834, loss: 0.56946, lr: 0.671231, top1: 0.21589, throughput: 310.93 | 2022-04-11 01:14:11.848 [rank:1] [train], epoch: 2/50, iter: 200/834, loss: 0.56886, lr: 0.671231, top1: 0.21667, throughput: 310.38 | 2022-04-11 01:14:11.866 [rank:5] [train], epoch: 2/50, iter: 200/834, loss: 0.56523, lr: 0.671231, top1: 0.22375, throughput: 310.82 | 2022-04-11 01:14:11.871 [rank:3] [train], epoch: 2/50, iter: 200/834, loss: 0.56950, lr: 0.671231, top1: 0.21474, throughput: 310.50 | 2022-04-11 01:14:11.895 [rank:0] [train], epoch: 2/50, iter: 200/834, loss: 0.57033, lr: 0.671231, top1: 0.21208, throughput: 310.60 | 2022-04-11 01:14:11.903 [rank:6] [train], epoch: 2/50, iter: 200/834, loss: 0.56768, lr: 0.671231, top1: 0.21630, throughput: 310.50 | 2022-04-11 01:14:11.904 [rank:7] [train], epoch: 2/50, iter: 200/834, loss: 0.57046, lr: 0.671231, top1: 0.21547, throughput: 310.70 | 2022-04-11 01:14:11.917 [rank:4] [train], epoch: 2/50, iter: 300/834, loss: 0.55997, lr: 0.707164, top1: 0.23208, throughput: 313.50 | 2022-04-11 01:15:13.093 [rank:0] [train], epoch: 2/50, iter: 300/834, loss: 0.55826, lr: 0.707164, top1: 0.22922, throughput: 313.49 | 2022-04-11 01:15:13.149 [rank:6] [train], epoch: 2/50, iter: 300/834, loss: 0.56006, lr: 0.707164, top1: 0.22771, throughput: 313.44 | 2022-04-11 01:15:13.159 [rank:5] [train], epoch: 2/50, iter: 300/834, loss: 0.55875, lr: 0.707164, top1: 0.23172, throughput: 313.25 | 2022-04-11 01:15:13.165 [rank:3] [train], epoch: 2/50, iter: 300/834, loss: 0.55654, lr: 0.707164, top1: 0.23495, throughput: 313.19 | 2022-04-11 01:15:13.200 [rank:2] [train], epoch: 2/50, iter: 300/834, loss: 0.55855, lr: 0.707164, top1: 0.23193, throughput: 312.91 | 2022-04-11 01:15:13.205 [rank:7] [train], epoch: 2/50, iter: 300/834, loss: 0.55925, lr: 0.707164, top1: 0.22927, throughput: 313.24 | 2022-04-11 01:15:13.212 [rank:1] [train], epoch: 2/50, iter: 300/834, loss: 0.55735, lr: 0.707164, top1: 0.23010, throughput: 313.37 | 2022-04-11 01:15:13.136 [rank:1] [train], epoch: 2/50, iter: 400/834, loss: 0.54876, lr: 0.743097, top1: 0.24260, throughput: 311.42 | 2022-04-11 01:16:14.789 [rank:6] [train], epoch: 2/50, iter: 400/834, loss: 0.54780, lr: 0.743097, top1: 0.24568, throughput: 311.51 | 2022-04-11 01:16:14.795 [rank:7] [train], epoch: 2/50, iter: 400/834, loss: 0.54850, lr: 0.743097, top1: 0.23932, throughput: 311.77 | 2022-04-11 01:16:14.795 [rank:4] [train], epoch: 2/50, iter: 400/834, loss: 0.54687, lr: 0.743097, top1: 0.24797, throughput: 311.08 | 2022-04-11 01:16:14.814 [rank:5] [train], epoch: 2/50, iter: 400/834, loss: 0.54797, lr: 0.743097, top1: 0.24187, throughput: 311.43 | 2022-04-11 01:16:14.816 [rank:0] [train], epoch: 2/50, iter: 400/834, loss: 0.54894, lr: 0.743097, top1: 0.24865, throughput: 311.27 [rank:2] [train], epoch: 2/50, iter: 400/834, loss: 0.54888, lr: 0.743097, top1: 0.24427, throughput: 311.56| 2022-04-11 01:16:14.831 | 2022-04-11 01:16:14.831 [rank:3] [train], epoch: 2/50, iter: 400/834, loss: 0.54763, lr: 0.743097, top1: 0.24474, throughput: 311.53 | 2022-04-11 01:16:14.832 [rank:5] [train], epoch: 2/50, iter: 500/834, loss: 0.53703, lr: 0.779030, top1: 0.26161, throughput: 311.83 | 2022-04-11 01:17:16.387 [rank:0] [train], epoch: 2/50, iter: 500/834, loss: 0.54063, lr: 0.779030, top1: 0.25417, throughput: 311.65 | 2022-04-11 01:17:16.439 [rank:6] [train], epoch: 2/50, iter: 500/834, loss: 0.53672, lr: 0.779030, top1: 0.26042, throughput: 311.40 | 2022-04-11 01:17:16.453 [rank:7] [train], epoch: 2/50, iter: 500/834, loss: 0.53984, lr: 0.779030, top1: 0.25651, throughput: 311.23 | 2022-04-11 01:17:16.486 [rank:1] [train], epoch: 2/50, iter: 500/834, loss: 0.54070, lr: 0.779030, top1: 0.25323, throughput: 311.09 | 2022-04-11 01:17:16.507 [rank:4] [train], epoch: 2/50, iter: 500/834, loss: 0.53712, lr: 0.779030, top1: 0.25453, throughput: 311.21 | 2022-04-11 01:17:16.509 [rank:2] [train], epoch: 2/50, iter: 500/834, loss: 0.54140, lr: 0.779030, top1: 0.25036, throughput: 311.26 | 2022-04-11 01:17:16.517 [rank:3] [train], epoch: 2/50, iter: 500/834, loss: 0.53916, lr: 0.779030, top1: 0.25474, throughput: 311.22 | 2022-04-11 01:17:16.525 [rank:6] [train], epoch: 2/50, iter: 600/834, loss: 0.53627, lr: 0.814963, top1: 0.25922, throughput: 314.07 | 2022-04-11 01:18:17.586 [rank:5] [train], epoch: 2/50, iter: 600/834, loss: 0.53018, lr: 0.814963, top1: 0.27062, throughput: 313.53 | 2022-04-11 01:18:17.626 [rank:1] [train], epoch: 2/50, iter: 600/834, loss: 0.53276, lr: 0.814963, top1: 0.26417, throughput: 314.14 | 2022-04-11 01:18:17.627 [rank:2] [train], epoch: 2/50, iter: 600/834, loss: 0.52820, lr: 0.814963, top1: 0.26844, throughput: 314.18 | 2022-04-11 01:18:17.628 [rank:7] [train], epoch: 2/50, iter: 600/834, loss: 0.53101, lr: 0.814963, top1: 0.26917, throughput: 313.91 | 2022-04-11 01:18:17.651 [rank:4] [train], epoch: 2/50, iter: 600/834, loss: 0.52897, lr: 0.814963, top1: 0.27427, throughput: 313.88 | 2022-04-11 01:18:17.679 [rank:3] [train], epoch: 2/50, iter: 600/834, loss: 0.52957, lr: 0.814963, top1: 0.26990, throughput: 313.92 | 2022-04-11 01:18:17.688 [rank:0] [train], epoch: 2/50, iter: 600/834, loss: 0.53123, lr: 0.814963, top1: 0.27047, throughput: 313.43 | 2022-04-11 01:18:17.697 [rank:6] [train], epoch: 2/50, iter: 700/834, loss: 0.52353, lr: 0.850896, top1: 0.27531, throughput: 313.19 | 2022-04-11 01:19:18.891 [rank:5] [train], epoch: 2/50, iter: 700/834, loss: 0.52059, lr: 0.850896, top1: 0.28354, throughput: 313.35 | 2022-04-11 01:19:18.899 [rank:3] [train], epoch: 2/50, iter: 700/834, loss: 0.51844, lr: 0.850896, top1: 0.28583, throughput: 313.57 | 2022-04-11 01:19:18.918 [rank:7] [train], epoch: 2/50, iter: 700/834, loss: 0.52199, lr: 0.850896, top1: 0.27875, throughput: 313.25 | 2022-04-11 01:19:18.943 [rank:2] [train], epoch: 2/50, iter: 700/834, loss: 0.52055, lr: 0.850896, top1: 0.28109, throughput: 313.10 | 2022-04-11 01:19:18.951 [rank:1] [train], epoch: 2/50, iter: 700/834, loss: 0.52027, lr: 0.850896, top1: 0.28292, throughput: 313.09 | 2022-04-11 01:19:18.951 [rank:4] [train], epoch: 2/50, iter: 700/834, loss: 0.52029, lr: 0.850896, top1: 0.28365, throughput: 313.69 | 2022-04-11 01:19:18.885 [rank:0] [train], epoch: 2/50, iter: 700/834, loss: 0.52211, lr: 0.850896, top1: 0.28052, throughput: 313.31 | 2022-04-11 01:19:18.979 [rank:0] [train], epoch: 2/50, iter: 800/834, loss: 0.51588, lr: 0.886830, top1: 0.29427, throughput: 311.81 | 2022-04-11 01:20:20.554 [rank:3] [train], epoch: 2/50, iter: 800/834, loss: 0.51592, lr: 0.886830, top1: 0.28474, throughput: 311.48 | 2022-04-11 01:20:20.559 [rank:1] [train], epoch: 2/50, iter: 800/834, loss: 0.51539, lr: 0.886830, top1: 0.29130, throughput: 311.64 | 2022-04-11 01:20:20.562 [rank:5] [train], epoch: 2/50, iter: 800/834, loss: 0.51559, lr: 0.886830, top1: 0.28688, throughput: 311.37 | 2022-04-11 01:20:20.562 [rank:6] [train], epoch: 2/50, iter: 800/834, loss: 0.51514, lr: 0.886830, top1: 0.28781, throughput: 311.30 | 2022-04-11 01:20:20.568 [rank:4] [train], epoch: 2/50, iter: 800/834, loss: 0.51260, lr: 0.886830, top1: 0.29542, throughput: 311.26 | 2022-04-11 01:20:20.570 [rank:7] [train], epoch: 2/50, iter: 800/834, loss: 0.51652, lr: 0.886830, top1: 0.29255, throughput: 311.51 | 2022-04-11 01:20:20.578 [rank:2] [train], epoch: 2/50, iter: 800/834, loss: 0.51651, lr: 0.886830, top1: 0.29021, throughput: 311.53 | 2022-04-11 01:20:20.583 [rank:6] [train], epoch: 2/50, iter: 834/834, loss: 0.51294, lr: 0.899047, top1: 0.29350, throughput: 314.14 | 2022-04-11 01:20:41.349 [rank:7] [train], epoch: 2/50, iter: 834/834, loss: 0.51092, lr: 0.899047, top1: 0.30162, throughput: 314.20 | 2022-04-11 01:20:41.355 [rank:4] [train], epoch: 2/50, iter: 834/834, loss: 0.50814, lr: 0.899047, top1: 0.30806, throughput: 314.06 | 2022-04-11 01:20:41.355 [rank:2] [train], epoch: 2/50, iter: 834/834, loss: 0.50923, lr: 0.899047, top1: 0.29948, throughput: 314.25 | 2022-04-11 01:20:41.356 [rank:1] [train], epoch: 2/50, iter: 834/834, loss: 0.50918, lr: 0.899047, top1: 0.30239, throughput: 313.84 | 2022-04-11 01:20:41.362 [rank:5] [train], epoch: 2/50, iter: 834/834, loss: 0.50924, lr: 0.899047, top1: 0.30270, throughput: 313.75 | 2022-04-11 01:20:41.368 [rank:0] [train], epoch: 2/50, iter: 834/834, loss: 0.50645, lr: 0.899047, top1: 0.30714, throughput: 313.56 | 2022-04-11 01:20:41.373 [rank:3] [train], epoch: 2/50, iter: 834/834, loss: 0.50921, lr: 0.899047, top1: 0.30009, throughput: 313.61 | 2022-04-11 01:20:41.375 [rank:0] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.26640, throughput: 485.95 | 2022-04-11 01:20:54.235 [rank:7] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.26464, throughput: 485.01 | 2022-04-11 01:20:54.241 [rank:6] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.26352, throughput: 484.68 | 2022-04-11 01:20:54.244 [rank:4] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.25808, throughput: 484.81 | 2022-04-11 01:20:54.247 [rank:2] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.26592, throughput: 484.82 | 2022-04-11 01:20:54.248 [rank:1] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.27152, throughput: 484.59 | 2022-04-11 01:20:54.260 [rank:5] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.24784, throughput: 484.62 | 2022-04-11 01:20:54.265 [rank:3] [eval], epoch: 2/50, iter: 125/125, loss: 0.00000, lr: 0.899047, top1: 0.25568, throughput: 484.62 | 2022-04-11 01:20:54.271 [rank:6] [train], epoch: 3/50, iter: 100/834, loss: 0.49935, lr: 0.934980, top1: 0.31599, throughput: 313.47 | 2022-04-11 01:21:55.495 [rank:7] [train], epoch: 3/50, iter: 100/834, loss: 0.49984, lr: 0.934980, top1: 0.30953, throughput: 313.40 | 2022-04-11 01:21:55.505 [rank:4] [train], epoch: 3/50, iter: 100/834, loss: 0.50288, lr: 0.934980, top1: 0.30693, throughput: 313.36 | 2022-04-11 01:21:55.519 [rank:1] [train], epoch: 3/50, iter: 100/834, loss: 0.50116, lr: 0.934980, top1: 0.30891, throughput: 313.35 | 2022-04-11 01:21:55.533 [rank:3] [train], epoch: 3/50, iter: 100/834, loss: 0.49857, lr: 0.934980, top1: 0.31839, throughput: 313.36 | 2022-04-11 01:21:55.542 [rank:2] [train], epoch: 3/50, iter: 100/834, loss: 0.50319, lr: 0.934980, top1: 0.31000, throughput: 313.18 | 2022-04-11 01:21:55.555 [rank:5] [train], epoch: 3/50, iter: 100/834, loss: 0.50072, lr: 0.934980, top1: 0.31594, throughput: 313.23 | 2022-04-11 01:21:55.562 [rank:0] [train], epoch: 3/50, iter: 100/834, loss: 0.49822, lr: 0.934980, top1: 0.31255, throughput: 313.47 | 2022-04-11 01:21:55.485 [rank:5] [train], epoch: 3/50, iter: 200/834, loss: 0.49750, lr: 0.970913, top1: 0.31589, throughput: 313.43 | 2022-04-11 01:22:56.820 [rank:6] [train], epoch: 3/50, iter: 200/834, loss: 0.49534, lr: 0.970913, top1: 0.32297, throughput: 313.07 | 2022-04-11 01:22:56.824 [rank:0] [train], epoch: 3/50, iter: 200/834, loss: 0.49518, lr: 0.970913, top1: 0.32078, throughput: 312.94 | 2022-04-11 01:22:56.838 [rank:4] [train], epoch: 3/50, iter: 200/834, loss: 0.49622, lr: 0.970913, top1: 0.31401, throughput: 313.11 | 2022-04-11 01:22:56.840 [rank:7] [train], epoch: 3/50, iter: 200/834, loss: 0.49777, lr: 0.970913, top1: 0.31724, throughput: 312.94 | 2022-04-11 01:22:56.858 [rank:2] [train], epoch: 3/50, iter: 200/834, loss: 0.49663, lr: 0.970913, top1: 0.31630, throughput: 313.16 | 2022-04-11 01:22:56.865 [rank:3] [train], epoch: 3/50, iter: 200/834, loss: 0.49627, lr: 0.970913, top1: 0.31865, throughput: 313.01 | 2022-04-11 01:22:56.881 [rank:1] [train], epoch: 3/50, iter: 200/834, loss: 0.49366, lr: 0.970913, top1: 0.31880, throughput: 312.85 | 2022-04-11 01:22:56.903 [rank:4] [train], epoch: 3/50, iter: 300/834, loss: 0.48850, lr: 1.006846, top1: 0.33474, throughput: 311.75 | 2022-04-11 01:23:58.428 [rank:0] [train], epoch: 3/50, iter: 300/834, loss: 0.49224, lr: 1.006846, top1: 0.32458, throughput: 311.69 | 2022-04-11 01:23:58.438 [rank:6] [train], epoch: 3/50, iter: 300/834, loss: 0.49149, lr: 1.006846, top1: 0.32573, throughput: 311.46 | 2022-04-11 01:23:58.469 [rank:1] [train], epoch: 3/50, iter: 300/834, loss: 0.49001, lr: 1.006846, top1: 0.32823, throughput: 311.80 | 2022-04-11 01:23:58.482 [rank:5] [train], epoch: 3/50, iter: 300/834, loss: 0.49144, lr: 1.006846, top1: 0.32526, throughput: 311.36 | 2022-04-11 01:23:58.485 [rank:3] [train], epoch: 3/50, iter: 300/834, loss: 0.49022, lr: 1.006846, top1: 0.32812, throughput: 311.60 | 2022-04-11 01:23:58.499 [rank:7] [train], epoch: 3/50, iter: 300/834, loss: 0.49166, lr: 1.006846, top1: 0.32771, throughput: 311.42 | 2022-04-11 01:23:58.512 [rank:2] [train], epoch: 3/50, iter: 300/834, loss: 0.48880, lr: 1.006846, top1: 0.32995, throughput: 311.37 | 2022-04-11 01:23:58.528 [rank:2] [train], epoch: 3/50, iter: 400/834, loss: 0.48679, lr: 1.042779, top1: 0.33365, throughput: 312.03 | 2022-04-11 01:25:00.060 [rank:5] [train], epoch: 3/50, iter: 400/834, loss: 0.48488, lr: 1.042779, top1: 0.33224, throughput: 311.73 | 2022-04-11 01:25:00.077 [rank:0] [train], epoch: 3/50, iter: 400/834, loss: 0.48331, lr: 1.042779, top1: 0.33807, throughput: 311.45 | 2022-04-11 01:25:00.085 [rank:6] [train], epoch: 3/50, iter: 400/834, loss: 0.48334, lr: 1.042779, top1: 0.34255, throughput: 311.56 | 2022-04-11 01:25:00.093 [rank:1] [train], epoch: 3/50, iter: 400/834, loss: 0.48460, lr: 1.042779, top1: 0.33937, throughput: 311.59 | 2022-04-11 01:25:00.101 [rank:7] [train], epoch: 3/50, iter: 400/834, loss: 0.48214, lr: 1.042779, top1: 0.34219, throughput: 311.71 | 2022-04-11 01:25:00.107 [rank:4] [train], epoch: 3/50, iter: 400/834, loss: 0.48626, lr: 1.042779, top1: 0.33406, throughput: 311.25 | 2022-04-11 01:25:00.115 [rank:3] [train], epoch: 3/50, iter: 400/834, loss: 0.48561, lr: 1.042779, top1: 0.33219, throughput: 311.57 | 2022-04-11 01:25:00.124 [rank:2] [train], epoch: 3/50, iter: 500/834, loss: 0.47920, lr: 1.078712, top1: 0.34464, throughput: 313.51 | 2022-04-11 01:26:01.302 [rank:3] [train], epoch: 3/50, iter: 500/834, loss: 0.47830, lr: 1.078712, top1: 0.35057, throughput: 313.83 | 2022-04-11 01:26:01.302 [rank:1] [train], epoch: 3/50, iter: 500/834, loss: 0.48034, lr: 1.078712, top1: 0.34604, throughput: 313.71 | 2022-04-11 01:26:01.303 [rank:6] [train], epoch: 3/50, iter: 500/834, loss: 0.48240, lr: 1.078712, top1: 0.34146, throughput: 313.57 | 2022-04-11 01:26:01.323 [rank:7] [train], epoch: 3/50, iter: 500/834, loss: 0.47850, lr: 1.078712, top1: 0.33974, throughput: 313.53 | 2022-04-11 01:26:01.345 [rank:4] [train], epoch: 3/50, iter: 500/834, loss: 0.47863, lr: 1.078712, top1: 0.34531, throughput: 313.56 | 2022-04-11 01:26:01.347 [rank:0] [train], epoch: 3/50, iter: 500/834, loss: 0.48249, lr: 1.078712, top1: 0.33802, throughput: 313.31 | 2022-04-11 01:26:01.365 [rank:5] [train], epoch: 3/50, iter: 500/834, loss: 0.47668, lr: 1.078712, top1: 0.34901, throughput: 313.14 | 2022-04-11 01:26:01.393 [rank:1] [train], epoch: 3/50, iter: 600/834, loss: 0.47535, lr: 1.114646, top1: 0.34927, throughput: 311.24 | 2022-04-11 01:27:02.993 [rank:7] [train], epoch: 3/50, iter: 600/834, loss: 0.47375, lr: 1.114646, top1: 0.35130, throughput: 311.43 | 2022-04-11 01:27:02.996 [rank:6] [train], epoch: 3/50, iter: 600/834, loss: 0.47415, lr: 1.114646, top1: 0.35297, throughput: 311.31 | 2022-04-11 01:27:02.998 [rank:5] [train], epoch: 3/50, iter: 600/834, loss: 0.47690, lr: 1.114646, top1: 0.35094, throughput: 311.66 | 2022-04-11 01:27:02.999 [rank:2] [train], epoch: 3/50, iter: 600/834, loss: 0.47457, lr: 1.114646, top1: 0.35047, throughput: 311.19 | 2022-04-11 01:27:03.000 [rank:0] [train], epoch: 3/50, iter: 600/834, loss: 0.47489, lr: 1.114646, top1: 0.35661, throughput: 311.50 | 2022-04-11 01:27:03.001 [rank:4] [train], epoch: 3/50, iter: 600/834, loss: 0.47738, lr: 1.114646, top1: 0.34849, throughput: 311.69 | 2022-04-11 01:27:02.948 [rank:3] [train], epoch: 3/50, iter: 600/834, loss: 0.47872, lr: 1.114646, top1: 0.34698, throughput: 310.97 | 2022-04-11 01:27:03.044 [rank:2] [train], epoch: 3/50, iter: 700/834, loss: 0.47304, lr: 1.150579, top1: 0.35604, throughput: 313.35 | 2022-04-11 01:28:04.273 [rank:4] [train], epoch: 3/50, iter: 700/834, loss: 0.47441, lr: 1.150579, top1: 0.35224, throughput: 312.87 | 2022-04-11 01:28:04.314 [rank:6] [train], epoch: 3/50, iter: 700/834, loss: 0.47082, lr: 1.150579, top1: 0.36042, throughput: 313.04 | 2022-04-11 01:28:04.332 [rank:7] [train], epoch: 3/50, iter: 700/834, loss: 0.46930, lr: 1.150579, top1: 0.35688, throughput: 313.01 | 2022-04-11 01:28:04.336 [rank:5] [train], epoch: 3/50, iter: 700/834, loss: 0.46847, lr: 1.150579, top1: 0.35964, throughput: 313.01 | 2022-04-11 01:28:04.339 [rank:0] [train], epoch: 3/50, iter: 700/834, loss: 0.47276, lr: 1.150579, top1: 0.35172, throughput: 312.87 | 2022-04-11 01:28:04.368 [rank:3] [train], epoch: 3/50, iter: 700/834, loss: 0.47019, lr: 1.150579, top1: 0.35557, throughput: 312.98 | 2022-04-11 01:28:04.391 [rank:1] [train], epoch: 3/50, iter: 700/834, loss: 0.47121, lr: 1.150579, top1: 0.35859, throughput: 312.60 | 2022-04-11 01:28:04.414 [rank:1] [train], epoch: 3/50, iter: 800/834, loss: 0.46673, lr: 1.186512, top1: 0.36750, throughput: 313.34 | 2022-04-11 01:29:05.689 [rank:5] [train], epoch: 3/50, iter: 800/834, loss: 0.46527, lr: 1.186512, top1: 0.37068, throughput: 312.76 | 2022-04-11 01:29:05.728 [rank:6] [train], epoch: 3/50, iter: 800/834, loss: 0.46747, lr: 1.186512, top1: 0.36224, throughput: 312.68 | 2022-04-11 01:29:05.737 [rank:2] [train], epoch: 3/50, iter: 800/834, loss: 0.46920, lr: 1.186512, top1: 0.36484, throughput: 312.34 | 2022-04-11 01:29:05.746 [rank:7] [train], epoch: 3/50, iter: 800/834, loss: 0.46910, lr: 1.186512, top1: 0.36047, throughput: 312.62 | 2022-04-11 01:29:05.753 [rank:4] [train], epoch: 3/50, iter: 800/834, loss: 0.46684, lr: 1.186512, top1: 0.36526, throughput: 312.42 | 2022-04-11 01:29:05.770 [rank:0] [train], epoch: 3/50, iter: 800/834, loss: 0.46866, lr: 1.186512, top1: 0.35990, throughput: 312.57 | 2022-04-11 01:29:05.794 [rank:3] [train], epoch: 3/50, iter: 800/834, loss: 0.46850, lr: 1.186512, top1: 0.36172, throughput: 312.62 | 2022-04-11 01:29:05.807 [rank:0] [train], epoch: 3/50, iter: 834/834, loss: 0.45877, lr: 1.198729, top1: 0.37316, throughput: 314.12 | 2022-04-11 01:29:26.576 [rank:5] [train], epoch: 3/50, iter: 834/834, loss: 0.45998, lr: 1.198729, top1: 0.37868, throughput: 312.80 | 2022-04-11 01:29:26.597 [rank:2] [train], epoch: 3/50, iter: 834/834, loss: 0.46075, lr: 1.198729, top1: 0.37975, throughput: 313.07 | 2022-04-11 01:29:26.597 [rank:4] [train], epoch: 3/50, iter: 834/834, loss: 0.46564, lr: 1.198729, top1: 0.36765, throughput: 313.27 | 2022-04-11 01:29:26.608 [rank:1] [train], epoch: 3/50, iter: 834/834, loss: 0.46566, lr: 1.198729, top1: 0.36903, throughput: 312.06 | 2022-04-11 01:29:26.609 [rank:6] [train], epoch: 3/50, iter: 834/834, loss: 0.46358, lr: 1.198729, top1: 0.36979, throughput: 312.69 | 2022-04-11 01:29:26.614 [rank:3] [train], epoch: 3/50, iter: 834/834, loss: 0.46201, lr: 1.198729, top1: 0.37531, throughput: 313.71 | 2022-04-11 01:29:26.616 [rank:7] [train], epoch: 3/50, iter: 834/834, loss: 0.46394, lr: 1.198729, top1: 0.37102, throughput: 312.83 | 2022-04-11 01:29:26.621 [rank:0] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.35904, throughput: 485.31 | 2022-04-11 01:29:39.454 [rank:1] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.35504, throughput: 486.28 | 2022-04-11 01:29:39.461 [rank:7] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.35328, throughput: 486.54 | 2022-04-11 01:29:39.467 [rank:5] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.34144, throughput: 485.51 | 2022-04-11 01:29:39.470 [rank:6] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.34528, throughput: 486.11 | 2022-04-11 01:29:39.472 [rank:4] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.35280, throughput: 485.86 | 2022-04-11 01:29:39.472 [rank:2] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.35808, throughput: 485.24 | 2022-04-11 01:29:39.478 [rank:3] [eval], epoch: 3/50, iter: 125/125, loss: 0.00000, lr: 1.198729, top1: 0.34448, throughput: 484.68 | 2022-04-11 01:29:39.511 [rank:4] [train], epoch: 4/50, iter: 100/834, loss: 0.45752, lr: 1.234662, top1: 0.37880, throughput: 314.73 | 2022-04-11 01:30:40.477 [rank:6] [train], epoch: 4/50, iter: 100/834, loss: 0.46128, lr: 1.234662, top1: 0.37349, throughput: 314.72 | 2022-04-11 01:30:40.477 [rank:5] [train], epoch: 4/50, iter: 100/834, loss: 0.45505, lr: 1.234662, top1: 0.37844, throughput: 314.55 | 2022-04-11 01:30:40.509 [rank:3] [train], epoch: 4/50, iter: 100/834, loss: 0.45248, lr: 1.234662, top1: 0.39328, throughput: 314.70 | 2022-04-11 01:30:40.520 [rank:0] [train], epoch: 4/50, iter: 100/834, loss: 0.45531, lr: 1.234662, top1: 0.38583, throughput: 314.41 | 2022-04-11 01:30:40.522 [rank:2] [train], epoch: 4/50, iter: 100/834, loss: 0.45220, lr: 1.234662, top1: 0.38990, throughput: 314.43 | 2022-04-11 01:30:40.541 [rank:1] [train], epoch: 4/50, iter: 100/834, loss: 0.45643, lr: 1.234662, top1: 0.38307, throughput: 314.27 | 2022-04-11 01:30:40.556 [rank:7] [train], epoch: 4/50, iter: 100/834, loss: 0.45678, lr: 1.234662, top1: 0.38089, throughput: 314.68 | 2022-04-11 01:30:40.480 [rank:0] [train], epoch: 4/50, iter: 200/834, loss: 0.45252, lr: 1.270595, top1: 0.38578, throughput: 313.67 | 2022-04-11 01:31:41.732 [rank:6] [train], epoch: 4/50, iter: 200/834, loss: 0.45585, lr: 1.270595, top1: 0.37891, throughput: 313.31 | 2022-04-11 01:31:41.758 [rank:1] [train], epoch: 4/50, iter: 200/834, loss: 0.45740, lr: 1.270595, top1: 0.37667, throughput: 313.71 | 2022-04-11 01:31:41.759 [rank:3] [train], epoch: 4/50, iter: 200/834, loss: 0.45334, lr: 1.270595, top1: 0.38760, throughput: 313.41 | 2022-04-11 01:31:41.781 [rank:5] [train], epoch: 4/50, iter: 200/834, loss: 0.45604, lr: 1.270595, top1: 0.37990, throughput: 313.30 | 2022-04-11 01:31:41.792 [rank:2] [train], epoch: 4/50, iter: 200/834, loss: 0.45470, lr: 1.270595, top1: 0.38365, throughput: 313.46 | 2022-04-11 01:31:41.793 [rank:4] [train], epoch: 4/50, iter: 200/834, loss: 0.45534, lr: 1.270595, top1: 0.38172, throughput: 313.07 | 2022-04-11 01:31:41.805 [rank:7] [train], epoch: 4/50, iter: 200/834, loss: 0.45438, lr: 1.270595, top1: 0.38677, throughput: 313.09 | 2022-04-11 01:31:41.805 [rank:2] [train], epoch: 4/50, iter: 300/834, loss: 0.44940, lr: 1.306529, top1: 0.39047, throughput: 312.75 | 2022-04-11 01:32:43.184 [rank:5] [train], epoch: 4/50, iter: 300/834, loss: 0.45030, lr: 1.306529, top1: 0.38958, throughput: 312.52 | 2022-04-11 01:32:43.228 [rank:7] [train], epoch: 4/50, iter: 300/834, loss: 0.44863, lr: 1.306529, top1: 0.39318, throughput: 312.50 | 2022-04-11 01:32:43.245 [rank:6] [train], epoch: 4/50, iter: 300/834, loss: 0.44933, lr: 1.306529, top1: 0.39120, throughput: 312.25 | 2022-04-11 01:32:43.247 [rank:4] [train], epoch: 4/50, iter: 300/834, loss: 0.45074, lr: 1.306529, top1: 0.39057, throughput: 312.46 | 2022-04-11 01:32:43.252 [rank:3] [train], epoch: 4/50, iter: 300/834, loss: 0.45272, lr: 1.306529, top1: 0.39083, throughput: 312.30 | 2022-04-11 01:32:43.260 [rank:1] [train], epoch: 4/50, iter: 300/834, loss: 0.44843, lr: 1.306529, top1: 0.39458, throughput: 312.19 | 2022-04-11 01:32:43.261 [rank:0] [train], epoch: 4/50, iter: 300/834, loss: 0.45234, lr: 1.306529, top1: 0.39141, throughput: 312.03 | 2022-04-11 01:32:43.265 [rank:1] [train], epoch: 4/50, iter: 400/834, loss: 0.44823, lr: 1.342462, top1: 0.39427, throughput: 312.33 | 2022-04-11 01:33:44.734 [rank:5] [train], epoch: 4/50, iter: 400/834, loss: 0.44493, lr: 1.342462, top1: 0.39891, throughput: 311.95 | 2022-04-11 01:33:44.777 [rank:4] [train], epoch: 4/50, iter: 400/834, loss: 0.44685, lr: 1.342462, top1: 0.39526, throughput: 312.05 | 2022-04-11 01:33:44.781 [rank:6] [train], epoch: 4/50, iter: 400/834, loss: 0.44849, lr: 1.342462, top1: 0.39349, throughput: 311.95 | 2022-04-11 01:33:44.795 [rank:3] [train], epoch: 4/50, iter: 400/834, loss: 0.44797, lr: 1.342462, top1: 0.39526, throughput: 311.93 | 2022-04-11 01:33:44.813 [rank:0] [train], epoch: 4/50, iter: 400/834, loss: 0.44946, lr: 1.342462, top1: 0.38906, throughput: 311.95 | 2022-04-11 01:33:44.814 [rank:2] [train], epoch: 4/50, iter: 400/834, loss: 0.44772, lr: 1.342462, top1: 0.39078, throughput: 311.41 | 2022-04-11 01:33:44.840 [rank:7] [train], epoch: 4/50, iter: 400/834, loss: 0.44519, lr: 1.342462, top1: 0.39953, throughput: 311.55 | 2022-04-11 01:33:44.874 [rank:2] [train], epoch: 4/50, iter: 500/834, loss: 0.44612, lr: 1.378395, top1: 0.39422, throughput: 314.32 | 2022-04-11 01:34:45.925 [rank:3] [train], epoch: 4/50, iter: 500/834, loss: 0.44449, lr: 1.378395, top1: 0.40620, throughput: 314.05 | 2022-04-11 01:34:45.949 [rank:1] [train], epoch: 4/50, iter: 500/834, loss: 0.44278, lr: 1.378395, top1: 0.39724, throughput: 313.56 | 2022-04-11 01:34:45.967 [rank:6] [train], epoch: 4/50, iter: 500/834, loss: 0.44434, lr: 1.378395, top1: 0.39536, throughput: 313.82 | 2022-04-11 01:34:45.977 [rank:4] [train], epoch: 4/50, iter: 500/834, loss: 0.44452, lr: 1.378395, top1: 0.40016, throughput: 313.71 | 2022-04-11 01:34:45.983 [rank:5] [train], epoch: 4/50, iter: 500/834, loss: 0.44555, lr: 1.378395, top1: 0.39526, throughput: 313.57 | 2022-04-11 01:34:46.007 [rank:0] [train], epoch: 4/50, iter: 500/834, loss: 0.44437, lr: 1.378395, top1: 0.39542, throughput: 313.70 | 2022-04-11 01:34:46.019 [rank:7] [train], epoch: 4/50, iter: 500/834, loss: 0.44492, lr: 1.378395, top1: 0.39682, throughput: 313.96 | 2022-04-11 01:34:46.029 [rank:2] [train], epoch: 4/50, iter: 600/834, loss: 0.44171, lr: 1.414328, top1: 0.39922, throughput: 311.44 | 2022-04-11 01:35:47.575 [rank:3] [train], epoch: 4/50, iter: 600/834, loss: 0.43884, lr: 1.414328, top1: 0.40870, throughput: 311.49 | 2022-04-11 01:35:47.589 [rank:0] [train], epoch: 4/50, iter: 600/834, loss: 0.44185, lr: 1.414328, top1: 0.40365, throughput: 311.80 | 2022-04-11 01:35:47.596 [rank:7] [train], epoch: 4/50, iter: 600/834, loss: 0.44250, lr: 1.414328, top1: 0.40135, throughput: 311.70 | 2022-04-11 01:35:47.627 [rank:5] [train], epoch: 4/50, iter: 600/834, loss: 0.44206, lr: 1.414328, top1: 0.40281, throughput: 311.57 | 2022-04-11 01:35:47.632 [rank:4] [train], epoch: 4/50, iter: 600/834, loss: 0.44330, lr: 1.414328, top1: 0.40156, throughput: 311.42 | 2022-04-11 01:35:47.635 [rank:1] [train], epoch: 4/50, iter: 600/834, loss: 0.43933, lr: 1.414328, top1: 0.40734, throughput: 311.31 | 2022-04-11 01:35:47.642 [rank:6] [train], epoch: 4/50, iter: 600/834, loss: 0.44131, lr: 1.414328, top1: 0.40958, throughput: 311.32 | 2022-04-11 01:35:47.650 [rank:4] [train], epoch: 4/50, iter: 700/834, loss: 0.43967, lr: 1.450261, top1: 0.40818, throughput: 313.47 | 2022-04-11 01:36:48.885 [rank:7] [train], epoch: 4/50, iter: 700/834, loss: 0.43948, lr: 1.450261, top1: 0.40651, throughput: 313.23 | 2022-04-11 01:36:48.923 [rank:0] [train], epoch: 4/50, iter: 700/834, loss: 0.43828, lr: 1.450261, top1: 0.40870, throughput: 313.02 | 2022-04-11 01:36:48.934 [rank:2] [train], epoch: 4/50, iter: 700/834, loss: 0.43921, lr: 1.450261, top1: 0.40651, throughput: 312.86 | 2022-04-11 01:36:48.945 [rank:5] [train], epoch: 4/50, iter: 700/834, loss: 0.43890, lr: 1.450261, top1: 0.40417, throughput: 313.03 | 2022-04-11 01:36:48.967 [rank:1] [train], epoch: 4/50, iter: 700/834, loss: 0.44228, lr: 1.450261, top1: 0.40417, throughput: 313.07 | 2022-04-11 01:36:48.971 [rank:3] [train], epoch: 4/50, iter: 700/834, loss: 0.43728, lr: 1.450261, top1: 0.40943, throughput: 312.63 | 2022-04-11 01:36:49.004 [rank:6] [train], epoch: 4/50, iter: 700/834, loss: 0.44201, lr: 1.450261, top1: 0.40302, throughput: 312.86 | 2022-04-11 01:36:49.019 [rank:6] [train], epoch: 4/50, iter: 800/834, loss: 0.43802, lr: 1.486194, top1: 0.41120, throughput: 314.51 | 2022-04-11 01:37:50.067 [rank:0] [train], epoch: 4/50, iter: 800/834, loss: 0.43494, lr: 1.486194, top1: 0.40750, throughput: 314.07 | 2022-04-11 01:37:50.068 [rank:2] [train], epoch: 4/50, iter: 800/834, loss: 0.43752, lr: 1.486194, top1: 0.40781, throughput: 314.06 | 2022-04-11 01:37:50.080 [rank:3] [train], epoch: 4/50, iter: 800/834, loss: 0.43721, lr: 1.486194, top1: 0.40990, throughput: 314.23 | 2022-04-11 01:37:50.106 [rank:7] [train], epoch: 4/50, iter: 800/834, loss: 0.43905, lr: 1.486194, top1: 0.40589, throughput: 313.76 | 2022-04-11 01:37:50.117 [rank:1] [train], epoch: 4/50, iter: 800/834, loss: 0.43688, lr: 1.486194, top1: 0.41000, throughput: 313.99 | 2022-04-11 01:37:50.119 [rank:5] [train], epoch: 4/50, iter: 800/834, loss: 0.43971, lr: 1.486194, top1: 0.40682, throughput: 313.97 | 2022-04-11 01:37:50.119 [rank:4] [train], epoch: 4/50, iter: 800/834, loss: 0.43675, lr: 1.486194, top1: 0.41109, throughput: 313.46 | 2022-04-11 01:37:50.138 [rank:2] [train], epoch: 4/50, iter: 834/834, loss: 0.43664, lr: 1.498411, top1: 0.40349, throughput: 311.16 | 2022-04-11 01:38:11.060 [rank:1] [train], epoch: 4/50, iter: 834/834, loss: 0.43521, lr: 1.498411, top1: 0.41100, throughput: 311.62 | 2022-04-11 01:38:11.068 [rank:4] [train], epoch: 4/50, iter: 834/834, loss: 0.43769, lr: 1.498411, top1: 0.41207, throughput: 311.84 | 2022-04-11 01:38:11.071 [rank:0] [train], epoch: 4/50, iter: 834/834, loss: 0.43313, lr: 1.498411, top1: 0.42387, throughput: 310.69 | 2022-04-11 01:38:11.079 [rank:3] [train], epoch: 4/50, iter: 834/834, loss: 0.43854, lr: 1.498411, top1: 0.40717, throughput: 311.05 | 2022-04-11 01:38:11.093 [rank:7] [train], epoch: 4/50, iter: 834/834, loss: 0.43545, lr: 1.498411, top1: 0.41131, throughput: 311.02 | 2022-04-11 01:38:11.106 [rank:6] [train], epoch: 4/50, iter: 834/834, loss: 0.43402, lr: 1.498411, top1: 0.41131, throughput: 309.95 | 2022-04-11 01:38:11.128 [rank:5] [train], epoch: 4/50, iter: 834/834, loss: 0.43460, lr: 1.498411, top1: 0.41559, throughput: 310.73 | 2022-04-11 01:38:11.128 [rank:0] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.38512, throughput: 491.33 | 2022-04-11 01:38:23.800 [rank:7] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.37984, throughput: 492.11 | 2022-04-11 01:38:23.807 [rank:2] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.37040, throughput: 490.09 | 2022-04-11 01:38:23.812 [rank:6] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.36352, throughput: 492.60 | 2022-04-11 01:38:23.816 [rank:4] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.35872, throughput: 490.16 | 2022-04-11 01:38:23.822 [rank:1] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.37248, throughput: 489.97 | 2022-04-11 01:38:23.823 [rank:5] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.35568, throughput: 492.24 | 2022-04-11 01:38:23.825 [rank:3] [eval], epoch: 4/50, iter: 125/125, loss: 0.00000, lr: 1.498411, top1: 0.37216, throughput: 489.82 | 2022-04-11 01:38:23.853 [rank:2] [train], epoch: 5/50, iter: 100/834, loss: 0.43006, lr: 1.496603, top1: 0.41651, throughput: 311.96 | 2022-04-11 01:39:25.359 [rank:3] [train], epoch: 5/50, iter: 100/834, loss: 0.43196, lr: 1.496603, top1: 0.41693, throughput: 312.15 | 2022-04-11 01:39:25.361 [rank:1] [train], epoch: 5/50, iter: 100/834, loss: 0.42918, lr: 1.496603, top1: 0.42036, throughput: 312.00 | 2022-04-11 01:39:25.363 [rank:6] [train], epoch: 5/50, iter: 100/834, loss: 0.42798, lr: 1.496603, top1: 0.42656, throughput: 311.92 | 2022-04-11 01:39:25.371 [rank:7] [train], epoch: 5/50, iter: 100/834, loss: 0.42688, lr: 1.496603, top1: 0.42974, throughput: 311.84 | 2022-04-11 01:39:25.376 [rank:0] [train], epoch: 5/50, iter: 100/834, loss: 0.42882, lr: 1.496603, top1: 0.42505, throughput: 311.65 | 2022-04-11 01:39:25.408 [rank:4] [train], epoch: 5/50, iter: 100/834, loss: 0.43084, lr: 1.496603, top1: 0.42005, throughput: 311.76 | 2022-04-11 01:39:25.408 [rank:5] [train], epoch: 5/50, iter: 100/834, loss: 0.42861, lr: 1.496603, top1: 0.42198, throughput: 312.12 | 2022-04-11 01:39:25.340 [rank:6] [train], epoch: 5/50, iter: 200/834, loss: 0.42625, lr: 1.494753, top1: 0.42948, throughput: 311.70 | 2022-04-11 01:40:26.969 [rank:7] [train], epoch: 5/50, iter: 200/834, loss: 0.42827, lr: 1.494753, top1: 0.42687, throughput: 311.70 | 2022-04-11 01:40:26.975 [rank:1] [train], epoch: 5/50, iter: 200/834, loss: 0.42755, lr: 1.494753, top1: 0.42802, throughput: 311.62 | 2022-04-11 01:40:26.977 [rank:0] [train], epoch: 5/50, iter: 200/834, loss: 0.42599, lr: 1.494753, top1: 0.42802, throughput: 311.80 | 2022-04-11 01:40:26.986 [rank:5] [train], epoch: 5/50, iter: 200/834, loss: 0.42815, lr: 1.494753, top1: 0.42547, throughput: 311.40 | 2022-04-11 01:40:26.997 [rank:2] [train], epoch: 5/50, iter: 200/834, loss: 0.42738, lr: 1.494753, top1: 0.42599, throughput: 311.46 | 2022-04-11 01:40:27.003 [rank:4] [train], epoch: 5/50, iter: 200/834, loss: 0.42486, lr: 1.494753, top1: 0.43057, throughput: 312.06 | 2022-04-11 01:40:26.935 [rank:3] [train], epoch: 5/50, iter: 200/834, loss: 0.42525, lr: 1.494753, top1: 0.43161, throughput: 311.29 | 2022-04-11 01:40:27.040 [rank:6] [train], epoch: 5/50, iter: 300/834, loss: 0.42224, lr: 1.492861, top1: 0.43417, throughput: 313.34 | 2022-04-11 01:41:28.244 [rank:1] [train], epoch: 5/50, iter: 300/834, loss: 0.42264, lr: 1.492861, top1: 0.43464, throughput: 313.36 | 2022-04-11 01:41:28.248 [rank:4] [train], epoch: 5/50, iter: 300/834, loss: 0.42373, lr: 1.492861, top1: 0.43255, throughput: 313.02 | 2022-04-11 01:41:28.273 [rank:7] [train], epoch: 5/50, iter: 300/834, loss: 0.42598, lr: 1.492861, top1: 0.42667, throughput: 313.16 | 2022-04-11 01:41:28.285 [rank:2] [train], epoch: 5/50, iter: 300/834, loss: 0.42729, lr: 1.492861, top1: 0.42911, throughput: 313.30 | 2022-04-11 01:41:28.287 [rank:5] [train], epoch: 5/50, iter: 300/834, loss: 0.42487, lr: 1.492861, top1: 0.42771, throughput: 313.20 | 2022-04-11 01:41:28.299 [rank:0] [train], epoch: 5/50, iter: 300/834, loss: 0.42726, lr: 1.492861, top1: 0.42672, throughput: 313.13 | 2022-04-11 01:41:28.303 [rank:3] [train], epoch: 5/50, iter: 300/834, loss: 0.42233, lr: 1.492861, top1: 0.43302, throughput: 313.36 | 2022-04-11 01:41:28.312 [rank:6] [train], epoch: 5/50, iter: 400/834, loss: 0.42249, lr: 1.490929, top1: 0.43083, throughput: 313.43 | 2022-04-11 01:42:29.501 [rank:1] [train], epoch: 5/50, iter: 400/834, loss: 0.42148, lr: 1.490929, top1: 0.43203, throughput: 313.34 | 2022-04-11 01:42:29.523 [rank:5] [train], epoch: 5/50, iter: 400/834, loss: 0.42126, lr: 1.490929, top1: 0.43427, throughput: 313.55 | 2022-04-11 01:42:29.533 [rank:4] [train], epoch: 5/50, iter: 400/834, loss: 0.42114, lr: 1.490929, top1: 0.43589, throughput: 313.41 | 2022-04-11 01:42:29.535 [rank:7] [train], epoch: 5/50, iter: 400/834, loss: 0.42332, lr: 1.490929, top1: 0.43260, throughput: 313.46 | 2022-04-11 01:42:29.536 [rank:3] [train], epoch: 5/50, iter: 400/834, loss: 0.42040, lr: 1.490929, top1: 0.43422, throughput: 313.38 | 2022-04-11 01:42:29.580 [rank:0] [train], epoch: 5/50, iter: 400/834, loss: 0.42194, lr: 1.490929, top1: 0.43318, throughput: 313.29 | 2022-04-11 01:42:29.589 [rank:2] [train], epoch: 5/50, iter: 400/834, loss: 0.42211, lr: 1.490929, top1: 0.43219, throughput: 313.16 | 2022-04-11 01:42:29.597 [rank:0] [train], epoch: 5/50, iter: 500/834, loss: 0.41966, lr: 1.488956, top1: 0.43896, throughput: 313.74 | 2022-04-11 01:43:30.786 [rank:6] [train], epoch: 5/50, iter: 500/834, loss: 0.42103, lr: 1.488956, top1: 0.43880, throughput: 313.15 | 2022-04-11 01:43:30.814 [rank:4] [train], epoch: 5/50, iter: 500/834, loss: 0.41681, lr: 1.488956, top1: 0.43891, throughput: 313.31 | 2022-04-11 01:43:30.817 [rank:3] [train], epoch: 5/50, iter: 500/834, loss: 0.42039, lr: 1.488956, top1: 0.44016, throughput: 313.45 | 2022-04-11 01:43:30.835 [rank:5] [train], epoch: 5/50, iter: 500/834, loss: 0.41734, lr: 1.488956, top1: 0.43896, throughput: 313.20 | 2022-04-11 01:43:30.835 [rank:1] [train], epoch: 5/50, iter: 500/834, loss: 0.42137, lr: 1.488956, top1: 0.43802, throughput: 313.02 | 2022-04-11 01:43:30.861 [rank:7] [train], epoch: 5/50, iter: 500/834, loss: 0.42031, lr: 1.488956, top1: 0.43833, throughput: 313.00 | 2022-04-11 01:43:30.877 [rank:2] [train], epoch: 5/50, iter: 500/834, loss: 0.42012, lr: 1.488956, top1: 0.43646, throughput: 313.13 | 2022-04-11 01:43:30.914 [rank:2] [train], epoch: 5/50, iter: 600/834, loss: 0.41667, lr: 1.486941, top1: 0.44130, throughput: 313.83 | 2022-04-11 01:44:32.094 [rank:5] [train], epoch: 5/50, iter: 600/834, loss: 0.41505, lr: 1.486941, top1: 0.44589, throughput: 313.40 | 2022-04-11 01:44:32.100 [rank:3] [train], epoch: 5/50, iter: 600/834, loss: 0.41684, lr: 1.486941, top1: 0.44667, throughput: 313.32 | 2022-04-11 01:44:32.114 [rank:1] [train], epoch: 5/50, iter: 600/834, loss: 0.41693, lr: 1.486941, top1: 0.44219, throughput: 313.40 | 2022-04-11 01:44:32.124 [rank:6] [train], epoch: 5/50, iter: 600/834, loss: 0.41531, lr: 1.486941, top1: 0.44802, throughput: 313.11 | 2022-04-11 01:44:32.133 [rank:0] [train], epoch: 5/50, iter: 600/834, loss: 0.42042, lr: 1.486941, top1: 0.43859, throughput: 312.90 | 2022-04-11 01:44:32.149 [rank:7] [train], epoch: 5/50, iter: 600/834, loss: 0.41690, lr: 1.486941, top1: 0.44359, throughput: 313.29 | 2022-04-11 01:44:32.163 [rank:4] [train], epoch: 5/50, iter: 600/834, loss: 0.42078, lr: 1.486941, top1: 0.43729, throughput: 312.97 | 2022-04-11 01:44:32.164 [rank:6] [train], epoch: 5/50, iter: 700/834, loss: 0.41647, lr: 1.484886, top1: 0.44271, throughput: 313.64 | 2022-04-11 01:45:33.351 [rank:2] [train], epoch: 5/50, iter: 700/834, loss: 0.41410, lr: 1.484886, top1: 0.44755, throughput: 313.43 | 2022-04-11 01:45:33.353 [rank:7] [train], epoch: 5/50, iter: 700/834, loss: 0.41345, lr: 1.484886, top1: 0.44854, throughput: 313.70 | 2022-04-11 01:45:33.369 [rank:0] [train], epoch: 5/50, iter: 700/834, loss: 0.41611, lr: 1.484886, top1: 0.43719, throughput: 313.54 | 2022-04-11 01:45:33.386 [rank:1] [train], epoch: 5/50, iter: 700/834, loss: 0.41311, lr: 1.484886, top1: 0.44776, throughput: 313.40 | 2022-04-11 01:45:33.388 [rank:4] [train], epoch: 5/50, iter: 700/834, loss: 0.41306, lr: 1.484886, top1: 0.44833, throughput: 313.58 | 2022-04-11 01:45:33.393 [rank:5] [train], epoch: 5/50, iter: 700/834, loss: 0.41425, lr: 1.484886, top1: 0.44677, throughput: 313.24 | 2022-04-11 01:45:33.395 [rank:3] [train], epoch: 5/50, iter: 700/834, loss: 0.41544, lr: 1.484886, top1: 0.44677, throughput: 313.01 | 2022-04-11 01:45:33.455 [rank:1] [train], epoch: 5/50, iter: 800/834, loss: 0.41444, lr: 1.482790, top1: 0.44859, throughput: 312.34 | 2022-04-11 01:46:34.860 [rank:6] [train], epoch: 5/50, iter: 800/834, loss: 0.41287, lr: 1.482790, top1: 0.45161, throughput: 312.13 | 2022-04-11 01:46:34.863 [rank:7] [train], epoch: 5/50, iter: 800/834, loss: 0.41114, lr: 1.482790, top1: 0.45286, throughput: 312.13[rank:5] [train], epoch: 5/50, iter: 800/834, loss: 0.41442, lr: 1.482790, top1: 0.44698, throughput: 312.26 | 2022-04-11 01:46:34.881| 2022-04-11 01:46:34.881 [rank:4] [train], epoch: 5/50, iter: 800/834, loss: 0.41421, lr: 1.482790, top1: 0.45167, throughput: 312.16 | 2022-04-11 01:46:34.900 [rank:0] [train], epoch: 5/50, iter: 800/834, loss: 0.41174, lr: 1.482790, top1: 0.44964, throughput: 312.03 | 2022-04-11 01:46:34.918 [rank:2] [train], epoch: 5/50, iter: 800/834, loss: 0.41216, lr: 1.482790, top1: 0.44979, throughput: 311.70 | 2022-04-11 01:46:34.951 [rank:3] [train], epoch: 5/50, iter: 800/834, loss: 0.41539, lr: 1.482790, top1: 0.44781, throughput: 312.73 | 2022-04-11 01:46:34.850 [rank:5] [train], epoch: 5/50, iter: 834/834, loss: 0.41582, lr: 1.482068, top1: 0.44654, throughput: 310.32 | 2022-04-11 01:46:55.918 [rank:6] [train], epoch: 5/50, iter: 834/834, loss: 0.41050, lr: 1.482068, top1: 0.45757, throughput: 310.01 | 2022-04-11 01:46:55.920 [rank:4] [train], epoch: 5/50, iter: 834/834, loss: 0.41190, lr: 1.482068, top1: 0.45282, throughput: 310.51 | 2022-04-11 01:46:55.923 [rank:0] [train], epoch: 5/50, iter: 834/834, loss: 0.40563, lr: 1.482068, top1: 0.46584, throughput: 310.72 | 2022-04-11 01:46:55.928 [rank:2] [train], epoch: 5/50, iter: 834/834, loss: 0.41072, lr: 1.482068, top1: 0.45573, throughput: 311.19[rank:3] [train], epoch: 5/50, iter: 834/834, loss: 0.40866, lr: 1.482068, top1: 0.44715, throughput: 309.69 | 2022-04-11 01:46:55.929 | 2022-04-11 01:46:55.929 [rank:7] [train], epoch: 5/50, iter: 834/834, loss: 0.41220, lr: 1.482068, top1: 0.45481, throughput: 310.14 | 2022-04-11 01:46:55.930 [rank:1] [train], epoch: 5/50, iter: 834/834, loss: 0.40633, lr: 1.482068, top1: 0.45159, throughput: 309.66 | 2022-04-11 01:46:55.941 [rank:2] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.45648, throughput: 483.85 | 2022-04-11 01:47:08.846 [rank:1] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.46800, throughput: 484.18 | 2022-04-11 01:47:08.849 [rank:4] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.45264, throughput: 483.51 | 2022-04-11 01:47:08.849 [rank:5] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.44784, throughput: 483.28 | 2022-04-11 01:47:08.850 [rank:6] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.45360, throughput: 483.28 | 2022-04-11 01:47:08.852 [rank:7] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.46592, throughput: 483.63 | 2022-04-11 01:47:08.853 [rank:0] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.46592, throughput: 483.19 | 2022-04-11 01:47:08.863 [rank:3] [eval], epoch: 5/50, iter: 125/125, loss: 0.00000, lr: 1.482068, top1: 0.45648, throughput: 482.25 | 2022-04-11 01:47:08.889 [rank:4] [train], epoch: 6/50, iter: 100/834, loss: 0.40498, lr: 1.479918, top1: 0.46083, throughput: 313.84 | 2022-04-11 01:48:10.027 [rank:7] [train], epoch: 6/50, iter: 100/834, loss: 0.40646, lr: 1.479918, top1: 0.45974, throughput: 313.68 | 2022-04-11 01:48:10.063 [rank:1] [train], epoch: 6/50, iter: 100/834, loss: 0.40672, lr: 1.479918, top1: 0.45880, throughput: 313.60 | 2022-04-11 01:48:10.073 [rank:6] [train], epoch: 6/50, iter: 100/834, loss: 0.40476, lr: 1.479918, top1: 0.46380, throughput: 313.55 | 2022-04-11 01:48:10.087 [rank:2] [train], epoch: 6/50, iter: 100/834, loss: 0.40799, lr: 1.479918, top1: 0.45344, throughput: 313.52 | 2022-04-11 01:48:10.087 [rank:0] [train], epoch: 6/50, iter: 100/834, loss: 0.40689, lr: 1.479918, top1: 0.45505, throughput: 313.53 | 2022-04-11 01:48:10.100 [rank:5] [train], epoch: 6/50, iter: 100/834, loss: 0.40391, lr: 1.479918, top1: 0.46552, throughput: 313.45 | 2022-04-11 01:48:10.104 [rank:3] [train], epoch: 6/50, iter: 100/834, loss: 0.40370, lr: 1.479918, top1: 0.46437, throughput: 313.60 | 2022-04-11 01:48:10.113 [rank:2] [train], epoch: 6/50, iter: 200/834, loss: 0.40554, lr: 1.477728, top1: 0.46115, throughput: 312.28 | 2022-04-11 01:49:11.571 [rank:0] [train], epoch: 6/50, iter: 200/834, loss: 0.40302, lr: 1.477728, top1: 0.46432, throughput: 311.97 | 2022-04-11 01:49:11.644 [rank:5] [train], epoch: 6/50, iter: 200/834, loss: 0.40360, lr: 1.477728, top1: 0.46891, throughput: 311.98 | 2022-04-11 01:49:11.646 [rank:6] [train], epoch: 6/50, iter: 200/834, loss: 0.40315, lr: 1.477728, top1: 0.46661, throughput: 311.85 | 2022-04-11 01:49:11.655 [rank:3] [train], epoch: 6/50, iter: 200/834, loss: 0.40391, lr: 1.477728, top1: 0.46214, throughput: 311.88 | 2022-04-11 01:49:11.674 [rank:1] [train], epoch: 6/50, iter: 200/834, loss: 0.40294, lr: 1.477728, top1: 0.46370, throughput: 311.68 | 2022-04-11 01:49:11.675 [rank:7] [train], epoch: 6/50, iter: 200/834, loss: 0.40472, lr: 1.477728, top1: 0.46021, throughput: 311.62 | 2022-04-11 01:49:11.675 [rank:4] [train], epoch: 6/50, iter: 200/834, loss: 0.40309, lr: 1.477728, top1: 0.46661, throughput: 311.42 | 2022-04-11 01:49:11.680 [rank:2] [train], epoch: 6/50, iter: 300/834, loss: 0.39975, lr: 1.475497, top1: 0.47214, throughput: 311.80 | 2022-04-11 01:50:13.148 [rank:6] [train], epoch: 6/50, iter: 300/834, loss: 0.40448, lr: 1.475497, top1: 0.46505, throughput: 312.22 | 2022-04-11 01:50:13.149 [rank:5] [train], epoch: 6/50, iter: 300/834, loss: 0.40313, lr: 1.475497, top1: 0.46302, throughput: 312.03 | 2022-04-11 01:50:13.179 [rank:4] [train], epoch: 6/50, iter: 300/834, loss: 0.40232, lr: 1.475497, top1: 0.47042, throughput: 312.17 | 2022-04-11 01:50:13.185 [rank:7] [train], epoch: 6/50, iter: 300/834, loss: 0.40230, lr: 1.475497, top1: 0.46995, throughput: 312.10 | 2022-04-11 01:50:13.194 [rank:3] [train], epoch: 6/50, iter: 300/834, loss: 0.40451, lr: 1.475497, top1: 0.46307, throughput: 312.03 | 2022-04-11 01:50:13.208 [rank:1] [train], epoch: 6/50, iter: 300/834, loss: 0.40568, lr: 1.475497, top1: 0.46073, throughput: 311.98 | 2022-04-11 01:50:13.217 [rank:0] [train], epoch: 6/50, iter: 300/834, loss: 0.40255, lr: 1.475497, top1: 0.46682, throughput: 311.71 | 2022-04-11 01:50:13.240 [rank:3] [train], epoch: 6/50, iter: 400/834, loss: 0.39970, lr: 1.473226, top1: 0.47354, throughput: 312.28 | 2022-04-11 01:51:14.691 [rank:4] [train], epoch: 6/50, iter: 400/834, loss: 0.40371, lr: 1.473226, top1: 0.46646, throughput: 312.13 | 2022-04-11 01:51:14.698 [rank:2] [train], epoch: 6/50, iter: 400/834, loss: 0.40221, lr: 1.473226, top1: 0.46865, throughput: 311.94 | 2022-04-11 01:51:14.699 [rank:5] [train], epoch: 6/50, iter: 400/834, loss: 0.40215, lr: 1.473226, top1: 0.46953, throughput: 312.07 | 2022-04-11 01:51:14.705 [rank:1] [train], epoch: 6/50, iter: 400/834, loss: 0.39943, lr: 1.473226, top1: 0.46740, throughput: 312.25 | 2022-04-11 01:51:14.707 [rank:6] [train], epoch: 6/50, iter: 400/834, loss: 0.40236, lr: 1.473226, top1: 0.47292, throughput: 312.17 | 2022-04-11 01:51:14.654 [rank:7] [train], epoch: 6/50, iter: 400/834, loss: 0.40106, lr: 1.473226, top1: 0.46760, throughput: 311.93 | 2022-04-11 01:51:14.746 [rank:0] [train], epoch: 6/50, iter: 400/834, loss: 0.40302, lr: 1.473226, top1: 0.46240, throughput: 312.07 | 2022-04-11 01:51:14.765 [rank:7] [train], epoch: 6/50, iter: 500/834, loss: 0.40341, lr: 1.470915, top1: 0.46776, throughput: 312.07 | 2022-04-11 01:52:16.270 [rank:1] [train], epoch: 6/50, iter: 500/834, loss: 0.40314, lr: 1.470915, top1: 0.46833, throughput: 311.83 | 2022-04-11 01:52:16.279 [rank:4] [train], epoch: 6/50, iter: 500/834, loss: 0.40110, lr: 1.470915, top1: 0.47052, throughput: 311.74 | 2022-04-11 01:52:16.288 [rank:5] [train], epoch: 6/50, iter: 500/834, loss: 0.39682, lr: 1.470915, top1: 0.47542, throughput: 311.66 | 2022-04-11 01:52:16.310 [rank:6] [train], epoch: 6/50, iter: 500/834, loss: 0.40406, lr: 1.470915, top1: 0.46474, throughput: 311.39 | 2022-04-11 01:52:16.314 [rank:3] [train], epoch: 6/50, iter: 500/834, loss: 0.40142, lr: 1.470915, top1: 0.46885, throughput: 311.54 | 2022-04-11 01:52:16.320 [rank:0] [train], epoch: 6/50, iter: 500/834, loss: 0.40144, lr: 1.470915, top1: 0.47156, throughput: 311.85 | 2022-04-11 01:52:16.334 [rank:2] [train], epoch: 6/50, iter: 500/834, loss: 0.40220, lr: 1.470915, top1: 0.47161, throughput: 311.50 | 2022-04-11 01:52:16.337 [rank:7] [train], epoch: 6/50, iter: 600/834, loss: 0.40218, lr: 1.468564, top1: 0.46339, throughput: 312.67 | 2022-04-11 01:53:17.677 [rank:4] [train], epoch: 6/50, iter: 600/834, loss: 0.40159, lr: 1.468564, top1: 0.46922, throughput: 312.72 | 2022-04-11 01:53:17.685 [rank:6] [train], epoch: 6/50, iter: 600/834, loss: 0.39973, lr: 1.468564, top1: 0.47068, throughput: 312.79 | 2022-04-11 01:53:17.697 [rank:5] [train], epoch: 6/50, iter: 600/834, loss: 0.40003, lr: 1.468564, top1: 0.47146, throughput: 312.72 | 2022-04-11 01:53:17.706 [rank:1] [train], epoch: 6/50, iter: 600/834, loss: 0.39875, lr: 1.468564, top1: 0.47276, throughput: 312.53 | 2022-04-11 01:53:17.714 [rank:3] [train], epoch: 6/50, iter: 600/834, loss: 0.40084, lr: 1.468564, top1: 0.47109, throughput: 312.68 | 2022-04-11 01:53:17.724 [rank:0] [train], epoch: 6/50, iter: 600/834, loss: 0.40095, lr: 1.468564, top1: 0.46750, throughput: 312.64 | 2022-04-11 01:53:17.746 [rank:2] [train], epoch: 6/50, iter: 600/834, loss: 0.39951, lr: 1.468564, top1: 0.46964, throughput: 312.63 | 2022-04-11 01:53:17.752 [rank:4] [train], epoch: 6/50, iter: 700/834, loss: 0.39922, lr: 1.466173, top1: 0.47406, throughput: 313.99 | 2022-04-11 01:54:18.833 [rank:1] [train], epoch: 6/50, iter: 700/834, loss: 0.39734, lr: 1.466173, top1: 0.47359, throughput: 313.99 | 2022-04-11 01:54:18.863 [rank:6] [train], epoch: 6/50, iter: 700/834, loss: 0.39986, lr: 1.466173, top1: 0.47370, throughput: 313.87 | 2022-04-11 01:54:18.868 [rank:0] [train], epoch: 6/50, iter: 700/834, loss: 0.39495, lr: 1.466173, top1: 0.47896, throughput: 314.10 | 2022-04-11 01:54:18.873 [rank:5] [train], epoch: 6/50, iter: 700/834, loss: 0.39551, lr: 1.466173, top1: 0.48000, throughput: 313.88 | 2022-04-11 01:54:18.875 [rank:7] [train], epoch: 6/50, iter: 700/834, loss: 0.39784, lr: 1.466173, top1: 0.47505, throughput: 313.72 | 2022-04-11 01:54:18.879 [rank:2] [train], epoch: 6/50, iter: 700/834, loss: 0.39793, lr: 1.466173, top1: 0.47729, throughput: 314.07 | 2022-04-11 01:54:18.885 [rank:3] [train], epoch: 6/50, iter: 700/834, loss: 0.39822, lr: 1.466173, top1: 0.47865, throughput: 313.77 | 2022-04-11 01:54:18.916 [rank:4] [train], epoch: 6/50, iter: 800/834, loss: 0.39630, lr: 1.463742, top1: 0.47995, throughput: 314.28 | 2022-04-11 01:55:19.925 [rank:7] [train], epoch: 6/50, iter: 800/834, loss: 0.39914, lr: 1.463742, top1: 0.47661, throughput: 314.43 | 2022-04-11 01:55:19.942 [rank:0] [train], epoch: 6/50, iter: 800/834, loss: 0.39503, lr: 1.463742, top1: 0.47937, throughput: 314.33 | 2022-04-11 01:55:19.954 [rank:5] [train], epoch: 6/50, iter: 800/834, loss: 0.39686, lr: 1.463742, top1: 0.47776, throughput: 314.34 | 2022-04-11 01:55:19.955 [rank:2] [train], epoch: 6/50, iter: 800/834, loss: 0.39674, lr: 1.463742, top1: 0.47510, throughput: 314.27 | 2022-04-11 01:55:19.978 [rank:3] [train], epoch: 6/50, iter: 800/834, loss: 0.39737, lr: 1.463742, top1: 0.47969, throughput: 314.42 | 2022-04-11 01:55:19.980 [rank:1] [train], epoch: 6/50, iter: 800/834, loss: 0.39562, lr: 1.463742, top1: 0.48120, throughput: 314.10 | 2022-04-11 01:55:19.990 [rank:6] [train], epoch: 6/50, iter: 800/834, loss: 0.39564, lr: 1.463742, top1: 0.47797, throughput: 314.12 | 2022-04-11 01:55:19.991 [rank:2] [train], epoch: 6/50, iter: 834/834, loss: 0.40038, lr: 1.462907, top1: 0.46982, throughput: 309.55 | 2022-04-11 01:55:41.067 [rank:7] [train], epoch: 6/50, iter: 834/834, loss: 0.39798, lr: 1.462907, top1: 0.47442, throughput: 309.00 | 2022-04-11 01:55:41.068 [rank:5] [train], epoch: 6/50, iter: 834/834, loss: 0.39386, lr: 1.462907, top1: 0.48085, throughput: 309.19 | 2022-04-11 01:55:41.068 [rank:0] [train], epoch: 6/50, iter: 834/834, loss: 0.39340, lr: 1.462907, top1: 0.48744, throughput: 309.06 | 2022-04-11 01:55:41.076 [rank:3] [train], epoch: 6/50, iter: 834/834, loss: 0.39375, lr: 1.462907, top1: 0.47871, throughput: 309.52 | 2022-04-11 01:55:41.071 [rank:6] [train], epoch: 6/50, iter: 834/834, loss: 0.39515, lr: 1.462907, top1: 0.47044, throughput: 309.58 | 2022-04-11 01:55:41.078 [rank:1] [train], epoch: 6/50, iter: 834/834, loss: 0.39461, lr: 1.462907, top1: 0.48070, throughput: 309.57 | 2022-04-11 01:55:41.078 [rank:4] [train], epoch: 6/50, iter: 834/834, loss: 0.39769, lr: 1.462907, top1: 0.47518, throughput: 307.95 | 2022-04-11 01:55:41.123 [rank:0] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.47792, throughput: 491.44 | 2022-04-11 01:55:53.794 [rank:4] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.46592, throughput: 493.23 | 2022-04-11 01:55:53.795 [rank:5] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.45824, throughput: 491.02 | 2022-04-11 01:55:53.797 [rank:7] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.47616, throughput: 490.86 | 2022-04-11 01:55:53.801 [rank:1] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.47184, throughput: 491.22 | 2022-04-11 01:55:53.801 [rank:6] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.46752, throughput: 491.21 | 2022-04-11 01:55:53.801 [rank:2] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.47328, throughput: 490.57 | 2022-04-11 01:55:53.807 [rank:3] [eval], epoch: 6/50, iter: 125/125, loss: 0.00000, lr: 1.462907, top1: 0.46000, throughput: 489.49 | 2022-04-11 01:55:53.839 [rank:4] [train], epoch: 7/50, iter: 100/834, loss: 0.38934, lr: 1.460424, top1: 0.48953, throughput: 313.15 | 2022-04-11 01:56:55.108 [rank:1] [train], epoch: 7/50, iter: 100/834, loss: 0.39115, lr: 1.460424, top1: 0.48891, throughput: 313.16 | 2022-04-11 01:56:55.112 [rank:3] [train], epoch: 7/50, iter: 100/834, loss: 0.39562, lr: 1.460424, top1: 0.48307, throughput: 313.35 | 2022-04-11 01:56:55.113 [rank:2] [train], epoch: 7/50, iter: 100/834, loss: 0.39113, lr: 1.460424, top1: 0.48448, throughput: 313.17 | 2022-04-11 01:56:55.116 [rank:5] [train], epoch: 7/50, iter: 100/834, loss: 0.38800, lr: 1.460424, top1: 0.49281, throughput: 313.10 | 2022-04-11 01:56:55.119 [rank:0] [train], epoch: 7/50, iter: 100/834, loss: 0.38721, lr: 1.460424, top1: 0.49406, throughput: 312.95 | 2022-04-11 01:56:55.146 [rank:6] [train], epoch: 7/50, iter: 100/834, loss: 0.39225, lr: 1.460424, top1: 0.48375, throughput: 312.84 | 2022-04-11 01:56:55.174 [rank:7] [train], epoch: 7/50, iter: 100/834, loss: 0.38994, lr: 1.460424, top1: 0.49135, throughput: 312.79 | 2022-04-11 01:56:55.183 [rank:2] [train], epoch: 7/50, iter: 200/834, loss: 0.39004, lr: 1.457901, top1: 0.48875, throughput: 313.34 | 2022-04-11 01:57:56.392 [rank:0] [train], epoch: 7/50, iter: 200/834, loss: 0.38822, lr: 1.457901, top1: 0.48937, throughput: 313.31 | 2022-04-11 01:57:56.428 [rank:7] [train], epoch: 7/50, iter: 200/834, loss: 0.39389, lr: 1.457901, top1: 0.48208, throughput: 313.46 | 2022-04-11 01:57:56.435 [rank:5] [train], epoch: 7/50, iter: 200/834, loss: 0.39131, lr: 1.457901, top1: 0.48589, throughput: 313.07 | 2022-04-11 01:57:56.448 [rank:1] [train], epoch: 7/50, iter: 200/834, loss: 0.39069, lr: 1.457901, top1: 0.49130, throughput: 312.97 | 2022-04-11 01:57:56.460 [rank:4] [train], epoch: 7/50, iter: 200/834, loss: 0.39003, lr: 1.457901, top1: 0.48375, throughput: 313.32 | 2022-04-11 01:57:56.386 [rank:3] [train], epoch: 7/50, iter: 200/834, loss: 0.38985, lr: 1.457901, top1: 0.48682, throughput: 312.88 | 2022-04-11 01:57:56.479 [rank:6] [train], epoch: 7/50, iter: 200/834, loss: 0.39074, lr: 1.457901, top1: 0.48573, throughput: 313.54 | 2022-04-11 01:57:56.410 [rank:1] [train], epoch: 7/50, iter: 300/834, loss: 0.39214, lr: 1.455340, top1: 0.48380, throughput: 314.81 | 2022-04-11 01:58:57.448 [rank:6] [train], epoch: 7/50, iter: 300/834, loss: 0.38813, lr: 1.455340, top1: 0.49266, throughput: 314.45 | 2022-04-11 01:58:57.469 [rank:4] [train], epoch: 7/50, iter: 300/834, loss: 0.38890, lr: 1.455340, top1: 0.48990, throughput: 314.31 | 2022-04-11 01:58:57.473 [rank:5] [train], epoch: 7/50, iter: 300/834, loss: 0.39224, lr: 1.455340, top1: 0.48219, throughput: 314.55 | 2022-04-11 01:58:57.488 [rank:2] [train], epoch: 7/50, iter: 300/834, loss: 0.39095, lr: 1.455340, top1: 0.48984, throughput: 314.17 | 2022-04-11 01:58:57.506 [rank:3] [train], epoch: 7/50, iter: 300/834, loss: 0.38688, lr: 1.455340, top1: 0.49365, throughput: 314.45 | 2022-04-11 01:58:57.538 [rank:7] [train], epoch: 7/50, iter: 300/834, loss: 0.38947, lr: 1.455340, top1: 0.48859, throughput: 314.22 | 2022-04-11 01:58:57.538 [rank:0] [train], epoch: 7/50, iter: 300/834, loss: 0.39084, lr: 1.455340, top1: 0.48521, throughput: 314.12 | 2022-04-11 01:58:57.552 [rank:3] [train], epoch: 7/50, iter: 400/834, loss: 0.38909, lr: 1.452739, top1: 0.49026, throughput: 312.23 | 2022-04-11 01:59:59.030 [rank:2] [train], epoch: 7/50, iter: 400/834, loss: 0.38988, lr: 1.452739, top1: 0.48937, throughput: 311.96 | 2022-04-11 01:59:59.053 [rank:4] [train], epoch: 7/50, iter: 400/834, loss: 0.38807, lr: 1.452739, top1: 0.48859, throughput: 311.73 | 2022-04-11 01:59:59.064 [rank:7] [train], epoch: 7/50, iter: 400/834, loss: 0.39121, lr: 1.452739, top1: 0.48474, throughput: 312.00 | 2022-04-11 01:59:59.077 [rank:0] [train], epoch: 7/50, iter: 400/834, loss: 0.38598, lr: 1.452739, top1: 0.49724, throughput: 312.07 | 2022-04-11 01:59:59.077 [rank:1] [train], epoch: 7/50, iter: 400/834, loss: 0.38857, lr: 1.452739, top1: 0.49193, throughput: 311.54 | 2022-04-11 01:59:59.078 [rank:5] [train], epoch: 7/50, iter: 400/834, loss: 0.38722, lr: 1.452739, top1: 0.49328, throughput: 311.63 | 2022-04-11 01:59:59.100 [rank:6] [train], epoch: 7/50, iter: 400/834, loss: 0.38435, lr: 1.452739, top1: 0.49786, throughput: 311.97 | 2022-04-11 01:59:59.013 [rank:6] [train], epoch: 7/50, iter: 500/834, loss: 0.38834, lr: 1.450099, top1: 0.48536, throughput: 313.16 | 2022-04-11 02:01:00.323 [rank:4] [train], epoch: 7/50, iter: 500/834, loss: 0.39075, lr: 1.450099, top1: 0.48318, throughput: 313.32 | 2022-04-11 02:01:00.344 [rank:0] [train], epoch: 7/50, iter: 500/834, loss: 0.38680, lr: 1.450099, top1: 0.49406, throughput: 313.33 | 2022-04-11 02:01:00.354 [rank:7] [train], epoch: 7/50, iter: 500/834, loss: 0.38790, lr: 1.450099, top1: 0.49552, throughput: 313.28 | 2022-04-11 02:01:00.363 [rank:3] [train], epoch: 7/50, iter: 500/834, loss: 0.38617, lr: 1.450099, top1: 0.49271, throughput: 312.88 | 2022-04-11 02:01:00.396 [rank:2] [train], epoch: 7/50, iter: 500/834, loss: 0.38806, lr: 1.450099, top1: 0.49156, throughput: 312.97 | 2022-04-11 02:01:00.401 [rank:5] [train], epoch: 7/50, iter: 500/834, loss: 0.39090, lr: 1.450099, top1: 0.48427, throughput: 313.59 | 2022-04-11 02:01:00.326 [rank:1] [train], epoch: 7/50, iter: 500/834, loss: 0.38945, lr: 1.450099, top1: 0.49073, throughput: 312.69 | 2022-04-11 02:01:00.481 [rank:5] [train], epoch: 7/50, iter: 600/834, loss: 0.39133, lr: 1.447421, top1: 0.48505, throughput: 312.12 | 2022-04-11 02:02:01.840 [rank:1] [train], epoch: 7/50, iter: 600/834, loss: 0.38959, lr: 1.447421, top1: 0.48724, throughput: 312.76 | 2022-04-11 02:02:01.870 [rank:2] [train], epoch: 7/50, iter: 600/834, loss: 0.38776, lr: 1.447421, top1: 0.49427, throughput: 312.31 | 2022-04-11 02:02:01.878 [rank:6] [train], epoch: 7/50, iter: 600/834, loss: 0.38820, lr: 1.447421, top1: 0.49167, throughput: 311.84 | 2022-04-11 02:02:01.892 [rank:0] [train], epoch: 7/50, iter: 600/834, loss: 0.38695, lr: 1.447421, top1: 0.49891, throughput: 312.00 | 2022-04-11 02:02:01.892 [rank:7] [train], epoch: 7/50, iter: 600/834, loss: 0.38637, lr: 1.447421, top1: 0.49687, throughput: 311.99 | 2022-04-11 02:02:01.903 [rank:3] [train], epoch: 7/50, iter: 600/834, loss: 0.38966, lr: 1.447421, top1: 0.48734, throughput: 312.07 | 2022-04-11 02:02:01.920 [rank:4] [train], epoch: 7/50, iter: 600/834, loss: 0.38995, lr: 1.447421, top1: 0.48641, throughput: 312.15 | 2022-04-11 02:02:01.852 [rank:7] [train], epoch: 7/50, iter: 700/834, loss: 0.38852, lr: 1.444704, top1: 0.49120, throughput: 312.81 | 2022-04-11 02:03:03.282 [rank:6] [train], epoch: 7/50, iter: 700/834, loss: 0.38751, lr: 1.444704, top1: 0.49484, throughput: 312.63 | 2022-04-11 02:03:03.307 [rank:4] [train], epoch: 7/50, iter: 700/834, loss: 0.38635, lr: 1.444704, top1: 0.49583, throughput: 312.39 | 2022-04-11 02:03:03.314 [rank:0] [train], epoch: 7/50, iter: 700/834, loss: 0.38792, lr: 1.444704, top1: 0.49292, throughput: 312.54 | 2022-04-11 02:03:03.324 [rank:2] [train], epoch: 7/50, iter: 700/834, loss: 0.38663, lr: 1.444704, top1: 0.49656, throughput: 312.46 | 2022-04-11 02:03:03.325 [rank:5] [train], epoch: 7/50, iter: 700/834, loss: 0.38946, lr: 1.444704, top1: 0.48802, throughput: 312.17 | 2022-04-11 02:03:03.346 [rank:3] [train], epoch: 7/50, iter: 700/834, loss: 0.38596, lr: 1.444704, top1: 0.49531, throughput: 312.52 | 2022-04-11 02:03:03.358 [rank:1] [train], epoch: 7/50, iter: 700/834, loss: 0.38745, lr: 1.444704, top1: 0.49229, throughput: 312.21 | 2022-04-11 02:03:03.366 [rank:4] [train], epoch: 7/50, iter: 800/834, loss: 0.38766, lr: 1.441949, top1: 0.48781, throughput: 312.60 | 2022-04-11 02:04:04.735 [rank:6] [train], epoch: 7/50, iter: 800/834, loss: 0.38755, lr: 1.441949, top1: 0.49240, throughput: 312.40 | 2022-04-11 02:04:04.766 [rank:7] [train], epoch: 7/50, iter: 800/834, loss: 0.38738, lr: 1.441949, top1: 0.49432, throughput: 312.22 | 2022-04-11 02:04:04.777 [rank:5] [train], epoch: 7/50, iter: 800/834, loss: 0.38706, lr: 1.441949, top1: 0.49505, throughput: 312.45 | 2022-04-11 02:04:04.796 [rank:1] [train], epoch: 7/50, iter: 800/834, loss: 0.38777, lr: 1.441949, top1: 0.49391, throughput: 312.47 | 2022-04-11 02:04:04.813 [rank:0] [train], epoch: 7/50, iter: 800/834, loss: 0.38796, lr: 1.441949, top1: 0.49615, throughput: 312.24 | 2022-04-11 02:04:04.814 [rank:2] [train], epoch: 7/50, iter: 800/834, loss: 0.38395, lr: 1.441949, top1: 0.49880, throughput: 312.19 | 2022-04-11 02:04:04.825 [rank:3] [train], epoch: 7/50, iter: 800/834, loss: 0.38736, lr: 1.441949, top1: 0.49193, throughput: 312.29 | 2022-04-11 02:04:04.839 [rank:4] [train], epoch: 7/50, iter: 834/834, loss: 0.38563, lr: 1.441004, top1: 0.50046, throughput: 310.83 | 2022-04-11 02:04:25.736 [rank:0] [train], epoch: 7/50, iter: 834/834, loss: 0.38983, lr: 1.441004, top1: 0.48560, throughput: 311.26 | 2022-04-11 02:04:25.787 [rank:7] [train], epoch: 7/50, iter: 834/834, loss: 0.38274, lr: 1.441004, top1: 0.49540, throughput: 310.65 | 2022-04-11 02:04:25.791 [rank:1] [train], epoch: 7/50, iter: 834/834, loss: 0.38614, lr: 1.441004, top1: 0.49969, throughput: 310.70 | 2022-04-11 02:04:25.824 [rank:5] [train], epoch: 7/50, iter: 834/834, loss: 0.38291, lr: 1.441004, top1: 0.49525, throughput: 310.44 | 2022-04-11 02:04:25.824 [rank:6] [train], epoch: 7/50, iter: 834/834, loss: 0.38204, lr: 1.441004, top1: 0.49663, throughput: 309.97 | 2022-04-11 02:04:25.826 [rank:3] [train], epoch: 7/50, iter: 834/834, loss: 0.38708, lr: 1.441004, top1: 0.49831, throughput: 310.64 | 2022-04-11 02:04:25.854 [rank:2] [train], epoch: 7/50, iter: 834/834, loss: 0.38843, lr: 1.441004, top1: 0.49050, throughput: 310.43 | 2022-04-11 02:04:25.854 [rank:0] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.49024, throughput: 485.34 | 2022-04-11 02:04:38.665 [rank:6] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.48080, throughput: 486.75 | 2022-04-11 02:04:38.666 [rank:4] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.47840, throughput: 483.19 | 2022-04-11 02:04:38.671 [rank:1] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.48384, throughput: 485.86 | 2022-04-11 02:04:38.687 [rank:5] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.46528, throughput: 485.82 | 2022-04-11 02:04:38.689 [rank:2] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.47584, throughput: 486.92 | 2022-04-11 02:04:38.690 [rank:7] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.48352, throughput: 484.42 | 2022-04-11 02:04:38.693 [rank:3] [eval], epoch: 7/50, iter: 125/125, loss: 0.00000, lr: 1.441004, top1: 0.46256, throughput: 485.73 | 2022-04-11 02:04:38.721 [rank:0] [train], epoch: 8/50, iter: 100/834, loss: 0.37647, lr: 1.438197, top1: 0.51125, throughput: 314.23 | 2022-04-11 02:05:39.767 [rank:4] [train], epoch: 8/50, iter: 100/834, loss: 0.37793, lr: 1.438197, top1: 0.50990, throughput: 314.10 | 2022-04-11 02:05:39.798 [rank:2] [train], epoch: 8/50, iter: 100/834, loss: 0.37723, lr: 1.438197, top1: 0.50885, throughput: 314.04 | 2022-04-11 02:05:39.829 [rank:3] [train], epoch: 8/50, iter: 100/834, loss: 0.38032, lr: 1.438197, top1: 0.50667, throughput: 314.19 | 2022-04-11 02:05:39.831 [rank:1] [train], epoch: 8/50, iter: 100/834, loss: 0.37967, lr: 1.438197, top1: 0.50880, throughput: 313.95 | 2022-04-11 02:05:39.843 [rank:7] [train], epoch: 8/50, iter: 100/834, loss: 0.37794, lr: 1.438197, top1: 0.50750, throughput: 313.97 | 2022-04-11 02:05:39.845 [rank:5] [train], epoch: 8/50, iter: 100/834, loss: 0.37992, lr: 1.438197, top1: 0.50448, throughput: 313.94 | 2022-04-11 02:05:39.846 [rank:6] [train], epoch: 8/50, iter: 100/834, loss: 0.37778, lr: 1.438197, top1: 0.50833, throughput: 313.55 | 2022-04-11 02:05:39.901 [rank:6] [train], epoch: 8/50, iter: 200/834, loss: 0.38015, lr: 1.435353, top1: 0.50510, throughput: 312.74[rank:1] [train], epoch: 8/50, iter: 200/834, loss: 0.38336, lr: 1.435353, top1: 0.49870, throughput: 312.45 | 2022-04-11 02:06:41.294 | 2022-04-11 02:06:41.294 [rank:0] [train], epoch: 8/50, iter: 200/834, loss: 0.38310, lr: 1.435353, top1: 0.50036, throughput: 311.92 | 2022-04-11 02:06:41.321 [rank:7] [train], epoch: 8/50, iter: 200/834, loss: 0.37882, lr: 1.435353, top1: 0.50984, throughput: 312.25 | 2022-04-11 02:06:41.334 [rank:3] [train], epoch: 8/50, iter: 200/834, loss: 0.38427, lr: 1.435353, top1: 0.49583, throughput: 312.14 | 2022-04-11 02:06:41.342 [rank:4] [train], epoch: 8/50, iter: 200/834, loss: 0.37915, lr: 1.435353, top1: 0.50766, throughput: 311.93 | 2022-04-11 02:06:41.350 [rank:2] [train], epoch: 8/50, iter: 200/834, loss: 0.37915, lr: 1.435353, top1: 0.50604, throughput: 312.00 | 2022-04-11 02:06:41.368 [rank:5] [train], epoch: 8/50, iter: 200/834, loss: 0.38004, lr: 1.435353, top1: 0.50682, throughput: 312.55 | 2022-04-11 02:06:41.276 [rank:7] [train], epoch: 8/50, iter: 300/834, loss: 0.37718, lr: 1.432470, top1: 0.50922, throughput: 312.71 | 2022-04-11 02:07:42.732 [rank:2] [train], epoch: 8/50, iter: 300/834, loss: 0.37883, lr: 1.432470, top1: 0.51094, throughput: 312.63 | 2022-04-11 02:07:42.782 [rank:3] [train], epoch: 8/50, iter: 300/834, loss: 0.38113, lr: 1.432470, top1: 0.50141, throughput: 312.50 | 2022-04-11 02:07:42.783 [rank:6] [train], epoch: 8/50, iter: 300/834, loss: 0.37732, lr: 1.432470, top1: 0.51104, throughput: 312.19 | 2022-04-11 02:07:42.795 [rank:4] [train], epoch: 8/50, iter: 300/834, loss: 0.37655, lr: 1.432470, top1: 0.51078, throughput: 312.38 | 2022-04-11 02:07:42.813 [rank:5] [train], epoch: 8/50, iter: 300/834, loss: 0.38431, lr: 1.432470, top1: 0.49823, throughput: 311.94 | 2022-04-11 02:07:42.827 [rank:0] [train], epoch: 8/50, iter: 300/834, loss: 0.38186, lr: 1.432470, top1: 0.50161, throughput: 312.15 | 2022-04-11 02:07:42.829 [rank:1] [train], epoch: 8/50, iter: 300/834, loss: 0.38064, lr: 1.432470, top1: 0.50240, throughput: 311.99 | 2022-04-11 02:07:42.834 [rank:6] [train], epoch: 8/50, iter: 400/834, loss: 0.38032, lr: 1.429550, top1: 0.50766, throughput: 312.03 | 2022-04-11 02:08:44.327 [rank:1] [train], epoch: 8/50, iter: 400/834, loss: 0.37782, lr: 1.429550, top1: 0.51078, throughput: 312.14 | 2022-04-11 02:08:44.345 [rank:7] [train], epoch: 8/50, iter: 400/834, loss: 0.37726, lr: 1.429550, top1: 0.51120, throughput: 311.54 | 2022-04-11 02:08:44.360 [rank:5] [train], epoch: 8/50, iter: 400/834, loss: 0.38004, lr: 1.429550, top1: 0.50255, throughput: 312.02 | 2022-04-11 02:08:44.361 [rank:4] [train], epoch: 8/50, iter: 400/834, loss: 0.37957, lr: 1.429550, top1: 0.50417, throughput: 311.86 | 2022-04-11 02:08:44.379 [rank:3] [train], epoch: 8/50, iter: 400/834, loss: 0.38105, lr: 1.429550, top1: 0.50255, throughput: 311.70 | 2022-04-11 02:08:44.381 [rank:2] [train], epoch: 8/50, iter: 400/834, loss: 0.37896, lr: 1.429550, top1: 0.50797, throughput: 311.65 | 2022-04-11 02:08:44.389 [rank:0] [train], epoch: 8/50, iter: 400/834, loss: 0.38045, lr: 1.429550, top1: 0.50323, throughput: 312.26 | 2022-04-11 02:08:44.315 [rank:1] [train], epoch: 8/50, iter: 500/834, loss: 0.37922, lr: 1.426592, top1: 0.50734, throughput: 312.29 | 2022-04-11 02:09:45.826 [rank:7] [train], epoch: 8/50, iter: 500/834, loss: 0.38125, lr: 1.426592, top1: 0.50776, throughput: 312.27 | 2022-04-11 02:09:45.845 [rank:6] [train], epoch: 8/50, iter: 500/834, loss: 0.37935, lr: 1.426592, top1: 0.50151, throughput: 312.10 | 2022-04-11 02:09:45.846 [rank:2] [train], epoch: 8/50, iter: 500/834, loss: 0.37684, lr: 1.426592, top1: 0.51547, throughput: 312.36 | 2022-04-11 02:09:45.857 [rank:0] [train], epoch: 8/50, iter: 500/834, loss: 0.38119, lr: 1.426592, top1: 0.50687, throughput: 311.96 | 2022-04-11 02:09:45.861 [rank:4] [train], epoch: 8/50, iter: 500/834, loss: 0.38045, lr: 1.426592, top1: 0.50198, throughput: 312.28 | 2022-04-11 02:09:45.863 [rank:5] [train], epoch: 8/50, iter: 500/834, loss: 0.37994, lr: 1.426592, top1: 0.50594, throughput: 312.11 | 2022-04-11 02:09:45.878 [rank:3] [train], epoch: 8/50, iter: 500/834, loss: 0.37724, lr: 1.426592, top1: 0.50708, throughput: 311.99 | 2022-04-11 02:09:45.922 [rank:3] [train], epoch: 8/50, iter: 600/834, loss: 0.38079, lr: 1.423597, top1: 0.50125, throughput: 313.59 | 2022-04-11 02:10:47.149 [rank:4] [train], epoch: 8/50, iter: 600/834, loss: 0.38265, lr: 1.423597, top1: 0.50297, throughput: 313.23 | 2022-04-11 02:10:47.160 [rank:6] [train], epoch: 8/50, iter: 600/834, loss: 0.37881, lr: 1.423597, top1: 0.51031, throughput: 313.14 | 2022-04-11 02:10:47.160 [rank:0] [train], epoch: 8/50, iter: 600/834, loss: 0.37697, lr: 1.423597, top1: 0.51177, throughput: 313.17 | 2022-04-11 02:10:47.170 [rank:1] [train], epoch: 8/50, iter: 600/834, loss: 0.37773, lr: 1.423597, top1: 0.50563, throughput: 312.98 | 2022-04-11 02:10:47.171 [rank:5] [train], epoch: 8/50, iter: 600/834, loss: 0.38080, lr: 1.423597, top1: 0.50375, throughput: 313.15 | 2022-04-11 02:10:47.190 [rank:2] [train], epoch: 8/50, iter: 600/834, loss: 0.37727, lr: 1.423597, top1: 0.51365, throughput: 312.84 | 2022-04-11 02:10:47.231 [rank:7] [train], epoch: 8/50, iter: 600/834, loss: 0.37873, lr: 1.423597, top1: 0.50505, throughput: 312.75 | 2022-04-11 02:10:47.236 [rank:5] [train], epoch: 8/50, iter: 700/834, loss: 0.37723, lr: 1.420565, top1: 0.50766, throughput: 311.45 | 2022-04-11 02:11:48.837 [rank:6] [train], epoch: 8/50, iter: 700/834, loss: 0.37861, lr: 1.420565, top1: 0.50552, throughput: 311.21 | 2022-04-11 02:11:48.855 [rank:7] [train], epoch: 8/50, iter: 700/834, loss: 0.37777, lr: 1.420565, top1: 0.51172, throughput: 311.57 | 2022-04-11 02:11:48.859 [rank:4] [train], epoch: 8/50, iter: 700/834, loss: 0.37659, lr: 1.420565, top1: 0.51271, throughput: 311.00 | 2022-04-11 02:11:48.896 [rank:3] [train], epoch: 8/50, iter: 700/834, loss: 0.37845, lr: 1.420565, top1: 0.51464, throughput: 310.90 | 2022-04-11 02:11:48.905 [rank:2] [train], epoch: 8/50, iter: 700/834, loss: 0.37887, lr: 1.420565, top1: 0.50609, throughput: 311.26 | 2022-04-11 02:11:48.916 [rank:0] [train], epoch: 8/50, iter: 700/834, loss: 0.37818, lr: 1.420565, top1: 0.50786, throughput: 310.89 | 2022-04-11 02:11:48.928 [rank:1] [train], epoch: 8/50, iter: 700/834, loss: 0.37726, lr: 1.420565, top1: 0.50865, throughput: 310.87 | 2022-04-11 02:11:48.933 [rank:4] [train], epoch: 8/50, iter: 800/834, loss: 0.37652, lr: 1.417496, top1: 0.51521, throughput: 313.19 | 2022-04-11 02:12:50.201 [rank:7] [train], epoch: 8/50, iter: 800/834, loss: 0.38103, lr: 1.417496, top1: 0.51057, throughput: 312.97 | 2022-04-11 02:12:50.207 [rank:6] [train], epoch: 8/50, iter: 800/834, loss: 0.38026, lr: 1.417496, top1: 0.50307, throughput: 312.93 | 2022-04-11 02:12:50.211 [rank:0] [train], epoch: 8/50, iter: 800/834, loss: 0.37828, lr: 1.417496, top1: 0.50844, throughput: 313.23 | 2022-04-11 02:12:50.225 [rank:5] [train], epoch: 8/50, iter: 800/834, loss: 0.37755, lr: 1.417496, top1: 0.50854, throughput: 312.64 | 2022-04-11 02:12:50.249 [rank:3] [train], epoch: 8/50, iter: 800/834, loss: 0.38016, lr: 1.417496, top1: 0.50474, throughput: 312.98 | 2022-04-11 02:12:50.250 [rank:1] [train], epoch: 8/50, iter: 800/834, loss: 0.37790, lr: 1.417496, top1: 0.50771, throughput: 312.92 | 2022-04-11 02:12:50.291 [rank:2] [train], epoch: 8/50, iter: 800/834, loss: 0.37685, lr: 1.417496, top1: 0.51302, throughput: 312.66 | 2022-04-11 02:12:50.324 [rank:4] [train], epoch: 8/50, iter: 834/834, loss: 0.37995, lr: 1.416444, top1: 0.50230, throughput: 311.46 | 2022-04-11 02:13:11.160 [rank:2] [train], epoch: 8/50, iter: 834/834, loss: 0.37695, lr: 1.416444, top1: 0.50873, throughput: 313.16 | 2022-04-11 02:13:11.169 [rank:5] [train], epoch: 8/50, iter: 834/834, loss: 0.37829, lr: 1.416444, top1: 0.50965, throughput: 311.98 | 2022-04-11 02:13:11.173 [rank:1] [train], epoch: 8/50, iter: 834/834, loss: 0.37863, lr: 1.416444, top1: 0.50383, throughput: 312.50 | 2022-04-11 02:13:11.180 [rank:3] [train], epoch: 8/50, iter: 834/834, loss: 0.37291, lr: 1.416444, top1: 0.51562, throughput: 311.89 | 2022-04-11 02:13:11.180 [rank:0] [train], epoch: 8/50, iter: 834/834, loss: 0.38120, lr: 1.416444, top1: 0.50276, throughput: 311.45 | 2022-04-11 02:13:11.185 [rank:6] [train], epoch: 8/50, iter: 834/834, loss: 0.37865, lr: 1.416444, top1: 0.49786, throughput: 311.02 | 2022-04-11 02:13:11.201 [rank:7] [train], epoch: 8/50, iter: 834/834, loss: 0.37520, lr: 1.416444, top1: 0.52037, throughput: 310.72 | 2022-04-11 02:13:11.216 [rank:0] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.51328, throughput: 485.14 | 2022-04-11 02:13:24.068 [rank:2] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.50272, throughput: 484.25 | 2022-04-11 02:13:24.076 [rank:6] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.50640, throughput: 485.25 | 2022-04-11 02:13:24.080 [rank:7] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.51200, throughput: 485.75 | 2022-04-11 02:13:24.083 [rank:4] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.50016, throughput: 483.62 | 2022-04-11 02:13:24.084 [rank:1] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.51728, throughput: 483.93 | 2022-04-11 02:13:24.095 [rank:5] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.49600, throughput: 483.22 | 2022-04-11 02:13:24.107 [rank:3] [eval], epoch: 8/50, iter: 125/125, loss: 0.00000, lr: 1.416444, top1: 0.50512, throughput: 482.96 | 2022-04-11 02:13:24.121 [rank:1] [train], epoch: 9/50, iter: 100/834, loss: 0.37444, lr: 1.413325, top1: 0.51615, throughput: 314.25 | 2022-04-11 02:14:25.194 [rank:0] [train], epoch: 9/50, iter: 100/834, loss: 0.37195, lr: 1.413325, top1: 0.52078, throughput: 314.05 | 2022-04-11 02:14:25.205 [rank:5] [train], epoch: 9/50, iter: 100/834, loss: 0.37390, lr: 1.413325, top1: 0.51635, throughput: 314.19 | 2022-04-11 02:14:25.216 [rank:6] [train], epoch: 9/50, iter: 100/834, loss: 0.37385, lr: 1.413325, top1: 0.51724, throughput: 314.05 | 2022-04-11 02:14:25.218 [rank:2] [train], epoch: 9/50, iter: 100/834, loss: 0.37008, lr: 1.413325, top1: 0.52354, throughput: 313.85 | 2022-04-11 02:14:25.251 [rank:3] [train], epoch: 9/50, iter: 100/834, loss: 0.36954, lr: 1.413325, top1: 0.52453, throughput: 314.07 | 2022-04-11 02:14:25.255 [rank:4] [train], epoch: 9/50, iter: 100/834, loss: 0.36902, lr: 1.413325, top1: 0.52755, throughput: 313.84 | 2022-04-11 02:14:25.260 [rank:7] [train], epoch: 9/50, iter: 100/834, loss: 0.37065, lr: 1.413325, top1: 0.52125, throughput: 314.19 | 2022-04-11 02:14:25.193 [rank:5] [train], epoch: 9/50, iter: 200/834, loss: 0.37229, lr: 1.410170, top1: 0.51786, throughput: 312.66 | 2022-04-11 02:15:26.624 [rank:6] [train], epoch: 9/50, iter: 200/834, loss: 0.37336, lr: 1.410170, top1: 0.51240, throughput: 312.43 | 2022-04-11 02:15:26.671 [rank:1] [train], epoch: 9/50, iter: 200/834, loss: 0.37092, lr: 1.410170, top1: 0.52062, throughput: 312.26 | 2022-04-11 02:15:26.680 [rank:0] [train], epoch: 9/50, iter: 200/834, loss: 0.36844, lr: 1.410170, top1: 0.52182, throughput: 312.29 | 2022-04-11 02:15:26.686 [rank:2] [train], epoch: 9/50, iter: 200/834, loss: 0.37229, lr: 1.410170, top1: 0.51823, throughput: 312.52 | 2022-04-11 02:15:26.687 [rank:7] [train], epoch: 9/50, iter: 200/834, loss: 0.37077, lr: 1.410170, top1: 0.52151, throughput: 312.34 | 2022-04-11 02:15:26.663 [rank:3] [train], epoch: 9/50, iter: 200/834, loss: 0.37262, lr: 1.410170, top1: 0.51125, throughput: 312.33 | 2022-04-11 02:15:26.729 [rank:4] [train], epoch: 9/50, iter: 200/834, loss: 0.37130, lr: 1.410170, top1: 0.51750, throughput: 312.34 | 2022-04-11 02:15:26.732 [rank:4] [train], epoch: 9/50, iter: 300/834, loss: 0.37627, lr: 1.406978, top1: 0.51177, throughput: 312.64 | 2022-04-11 02:16:28.145 [rank:2] [train], epoch: 9/50, iter: 300/834, loss: 0.37798, lr: 1.406978, top1: 0.50885, throughput: 312.29 | 2022-04-11 02:16:28.167 [rank:7] [train], epoch: 9/50, iter: 300/834, loss: 0.37471, lr: 1.406978, top1: 0.51286, throughput: 312.15 | 2022-04-11 02:16:28.172 [rank:6] [train], epoch: 9/50, iter: 300/834, loss: 0.37278, lr: 1.406978, top1: 0.51635, throughput: 312.12 | 2022-04-11 02:16:28.184 [rank:0] [train], epoch: 9/50, iter: 300/834, loss: 0.37257, lr: 1.406978, top1: 0.51630, throughput: 312.06 | 2022-04-11 02:16:28.213 [rank:3] [train], epoch: 9/50, iter: 300/834, loss: 0.37393, lr: 1.406978, top1: 0.51531, throughput: 312.27 | 2022-04-11 02:16:28.215 [rank:5] [train], epoch: 9/50, iter: 300/834, loss: 0.37664, lr: 1.406978, top1: 0.51234, throughput: 311.73 | 2022-04-11 02:16:28.215 [rank:1] [train], epoch: 9/50, iter: 300/834, loss: 0.37202, lr: 1.406978, top1: 0.52104, throughput: 311.81 | 2022-04-11 02:16:28.256 [rank:4] [train], epoch: 9/50, iter: 400/834, loss: 0.37241, lr: 1.403750, top1: 0.51906, throughput: 313.32 | 2022-04-11 02:17:29.424 [rank:1] [train], epoch: 9/50, iter: 400/834, loss: 0.36997, lr: 1.403750, top1: 0.52547, throughput: 313.62 | 2022-04-11 02:17:29.476 [rank:0] [train], epoch: 9/50, iter: 400/834, loss: 0.37057, lr: 1.403750, top1: 0.51896, throughput: 313.40 | 2022-04-11 02:17:29.477 [rank:2] [train], epoch: 9/50, iter: 400/834, loss: 0.37264, lr: 1.403750, top1: 0.51620, throughput: 313.10 | 2022-04-11 02:17:29.489 [rank:5] [train], epoch: 9/50, iter: 400/834, loss: 0.37393, lr: 1.403750, top1: 0.51599, throughput: 313.34 | 2022-04-11 02:17:29.490 [rank:3] [train], epoch: 9/50, iter: 400/834, loss: 0.37332, lr: 1.403750, top1: 0.51885, throughput: 313.23 | 2022-04-11 02:17:29.510 [rank:6] [train], epoch: 9/50, iter: 400/834, loss: 0.37127, lr: 1.403750, top1: 0.51875, throughput: 313.08 | 2022-04-11 02:17:29.511 [rank:7] [train], epoch: 9/50, iter: 400/834, loss: 0.37363, lr: 1.403750, top1: 0.52062, throughput: 312.97 | 2022-04-11 02:17:29.519 [rank:2] [train], epoch: 9/50, iter: 500/834, loss: 0.37470, lr: 1.400486, top1: 0.51594, throughput: 314.08 | 2022-04-11 02:18:30.619 [rank:1] [train], epoch: 9/50, iter: 500/834, loss: 0.37292, lr: 1.400486, top1: 0.51214, throughput: 313.90 | 2022-04-11 02:18:30.642 [rank:4] [train], epoch: 9/50, iter: 500/834, loss: 0.37380, lr: 1.400486, top1: 0.51604, throughput: 313.61 | 2022-04-11 02:18:30.648 [rank:0] [train], epoch: 9/50, iter: 500/834, loss: 0.36949, lr: 1.400486, top1: 0.52057, throughput: 313.81 | 2022-04-11 02:18:30.659 [rank:6] [train], epoch: 9/50, iter: 500/834, loss: 0.37070, lr: 1.400486, top1: 0.52109, throughput: 313.98 | 2022-04-11 02:18:30.661 [rank:5] [train], epoch: 9/50, iter: 500/834, loss: 0.37464, lr: 1.400486, top1: 0.51865, throughput: 313.82 | 2022-04-11 02:18:30.672 [rank:3] [train], epoch: 9/50, iter: 500/834, loss: 0.37049, lr: 1.400486, top1: 0.52120, throughput: 313.86 | 2022-04-11 02:18:30.685 [rank:7] [train], epoch: 9/50, iter: 500/834, loss: 0.37238, lr: 1.400486, top1: 0.51849, throughput: 313.86 | 2022-04-11 02:18:30.693 [rank:6] [train], epoch: 9/50, iter: 600/834, loss: 0.37116, lr: 1.397186, top1: 0.52344, throughput: 313.17 | 2022-04-11 02:19:31.969 [rank:1] [train], epoch: 9/50, iter: 600/834, loss: 0.37101, lr: 1.397186, top1: 0.52266, throughput: 313.05 | 2022-04-11 02:19:31.975 [rank:3] [train], epoch: 9/50, iter: 600/834, loss: 0.36930, lr: 1.397186, top1: 0.52312, throughput: 313.14 | 2022-04-11 02:19:31.999 [rank:4] [train], epoch: 9/50, iter: 600/834, loss: 0.37272, lr: 1.397186, top1: 0.51839, throughput: 312.89 | 2022-04-11 02:19:32.012 [rank:7] [train], epoch: 9/50, iter: 600/834, loss: 0.37145, lr: 1.397186, top1: 0.52010, throughput: 313.11 | 2022-04-11 02:19:32.013 [rank:0] [train], epoch: 9/50, iter: 600/834, loss: 0.37296, lr: 1.397186, top1: 0.51839, throughput: 312.87 | 2022-04-11 02:19:32.026 [rank:2] [train], epoch: 9/50, iter: 600/834, loss: 0.37229, lr: 1.397186, top1: 0.51698, throughput: 312.67 | 2022-04-11 02:19:32.027 [rank:5] [train], epoch: 9/50, iter: 600/834, loss: 0.37329, lr: 1.397186, top1: 0.51490, throughput: 312.87 | 2022-04-11 02:19:32.038 [rank:5] [train], epoch: 9/50, iter: 700/834, loss: 0.37032, lr: 1.393851, top1: 0.52203, throughput: 312.51 | 2022-04-11 02:20:33.476 [rank:7] [train], epoch: 9/50, iter: 700/834, loss: 0.37083, lr: 1.393851, top1: 0.52068, throughput: 312.33 | 2022-04-11 02:20:33.487 [rank:2] [train], epoch: 9/50, iter: 700/834, loss: 0.37172, lr: 1.393851, top1: 0.51974, throughput: 312.29 | 2022-04-11 02:20:33.508 [rank:3] [train], epoch: 9/50, iter: 700/834, loss: 0.36972, lr: 1.393851, top1: 0.52365, throughput: 312.12 | 2022-04-11 02:20:33.513 [rank:4] [train], epoch: 9/50, iter: 700/834, loss: 0.37384, lr: 1.393851, top1: 0.51818, throughput: 312.16 | 2022-04-11 02:20:33.519 [rank:6] [train], epoch: 9/50, iter: 700/834, loss: 0.37401, lr: 1.393851, top1: 0.51401, throughput: 311.88 | 2022-04-11 02:20:33.532 [rank:1] [train], epoch: 9/50, iter: 700/834, loss: 0.37112, lr: 1.393851, top1: 0.52005, throughput: 311.87 | 2022-04-11 02:20:33.538 [rank:0] [train], epoch: 9/50, iter: 700/834, loss: 0.37166, lr: 1.393851, top1: 0.52307, throughput: 312.03 | 2022-04-11 02:20:33.559 [rank:6] [train], epoch: 9/50, iter: 800/834, loss: 0.37056, lr: 1.390479, top1: 0.51766, throughput: 313.58 | 2022-04-11 02:21:34.760 [rank:4] [train], epoch: 9/50, iter: 800/834, loss: 0.37296, lr: 1.390479, top1: 0.52250, throughput: 313.36 | 2022-04-11 02:21:34.791 [rank:5] [train], epoch: 9/50, iter: 800/834, loss: 0.36792, lr: 1.390479, top1: 0.52661, throughput: 313.10 | 2022-04-11 02:21:34.799 [rank:7] [train], epoch: 9/50, iter: 800/834, loss: 0.36942, lr: 1.390479, top1: 0.52365, throughput: 313.11 | 2022-04-11 02:21:34.807 [rank:0] [train], epoch: 9/50, iter: 800/834, loss: 0.36922, lr: 1.390479, top1: 0.52109, throughput: 313.34 | 2022-04-11 02:21:34.835 [rank:1] [train], epoch: 9/50, iter: 800/834, loss: 0.37244, lr: 1.390479, top1: 0.51870, throughput: 313.13 | 2022-04-11 02:21:34.855 [rank:3] [train], epoch: 9/50, iter: 800/834, loss: 0.37310, lr: 1.390479, top1: 0.51896, throughput: 312.86 | 2022-04-11 02:21:34.882 [rank:2] [train], epoch: 9/50, iter: 800/834, loss: 0.37297, lr: 1.390479, top1: 0.51823, throughput: 312.67 | 2022-04-11 02:21:34.915 [rank:4] [train], epoch: 9/50, iter: 834/834, loss: 0.37238, lr: 1.389325, top1: 0.51915, throughput: 312.49 | 2022-04-11 02:21:55.681 [rank:6] [train], epoch: 9/50, iter: 834/834, loss: 0.37072, lr: 1.389325, top1: 0.52145, throughput: 312.01 | 2022-04-11 02:21:55.682 [rank:7] [train], epoch: 9/50, iter: 834/834, loss: 0.36892, lr: 1.389325, top1: 0.52849, throughput: 312.64 | 2022-04-11 02:21:55.687 [rank:2] [train], epoch: 9/50, iter: 834/834, loss: 0.36969, lr: 1.389325, top1: 0.52528, throughput: 314.25 [rank:5] [train], epoch: 9/50, iter: 834/834, loss: 0.36987, lr: 1.389325, top1: 0.52696, throughput: 312.47 | 2022-04-11 02:21:55.690 | 2022-04-11 02:21:55.689 [rank:1] [train], epoch: 9/50, iter: 834/834, loss: 0.36882, lr: 1.389325, top1: 0.52129, throughput: 313.28 | 2022-04-11 02:21:55.693 [rank:3] [train], epoch: 9/50, iter: 834/834, loss: 0.36972, lr: 1.389325, top1: 0.51746, throughput: 313.67 | 2022-04-11 02:21:55.694 [rank:0] [train], epoch: 9/50, iter: 834/834, loss: 0.37628, lr: 1.389325, top1: 0.51103, throughput: 312.75 | 2022-04-11 02:21:55.707 [rank:0] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.53792, throughput: 487.01 | 2022-04-11 02:22:08.541 [rank:4] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.53120, throughput: 485.67 | 2022-04-11 02:22:08.550 [rank:7] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.53680, throughput: 485.78 | 2022-04-11 02:22:08.553 [rank:6] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.51808, throughput: 485.31 | 2022-04-11 02:22:08.560 [rank:2] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.51904, throughput: 485.48 | 2022-04-11 02:22:08.562 [rank:1] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.52848, throughput: 484.53 | 2022-04-11 02:22:08.592 [rank:3] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.52464, throughput: 484.52 | 2022-04-11 02:22:08.593 [rank:5] [eval], epoch: 9/50, iter: 125/125, loss: 0.00000, lr: 1.389325, top1: 0.51264, throughput: 484.00 | 2022-04-11 02:22:08.603 [rank:7] [train], epoch: 10/50, iter: 100/834, loss: 0.36724, lr: 1.385907, top1: 0.52714, throughput: 313.24 | 2022-04-11 02:23:09.848 [rank:6] [train], epoch: 10/50, iter: 100/834, loss: 0.36563, lr: 1.385907, top1: 0.53068, throughput: 313.22 | 2022-04-11 02:23:09.860 [rank:5] [train], epoch: 10/50, iter: 100/834, loss: 0.36199, lr: 1.385907, top1: 0.54010, throughput: 313.41 | 2022-04-11 02:23:09.864 [rank:2] [train], epoch: 10/50, iter: 100/834, loss: 0.35987, lr: 1.385907, top1: 0.53938, throughput: 313.17 | 2022-04-11 02:23:09.872 [rank:4] [train], epoch: 10/50, iter: 100/834, loss: 0.36325, lr: 1.385907, top1: 0.53333, throughput: 313.05 | 2022-04-11 02:23:09.881 [rank:0] [train], epoch: 10/50, iter: 100/834, loss: 0.36438, lr: 1.385907, top1: 0.53146, throughput: 312.93 | 2022-04-11 02:23:09.897 [rank:1] [train], epoch: 10/50, iter: 100/834, loss: 0.36608, lr: 1.385907, top1: 0.52630, throughput: 313.16 | 2022-04-11 02:23:09.902 [rank:3] [train], epoch: 10/50, iter: 100/834, loss: 0.36442, lr: 1.385907, top1: 0.53234, throughput: 313.12 | 2022-04-11 02:23:09.912 [rank:0] [train], epoch: 10/50, iter: 200/834, loss: 0.36499, lr: 1.382453, top1: 0.53312, throughput: 315.64 | 2022-04-11 02:24:10.726 [rank:1] [train], epoch: 10/50, iter: 200/834, loss: 0.36590, lr: 1.382453, top1: 0.52880, throughput: 315.63 | 2022-04-11 02:24:10.733 [rank:5] [train], epoch: 10/50, iter: 200/834, loss: 0.36691, lr: 1.382453, top1: 0.52781, throughput: 315.38 | 2022-04-11 02:24:10.743 [rank:2] [train], epoch: 10/50, iter: 200/834, loss: 0.36485, lr: 1.382453, top1: 0.53078, throughput: 315.35 | 2022-04-11 02:24:10.757 [rank:6] [train], epoch: 10/50, iter: 200/834, loss: 0.36580, lr: 1.382453, top1: 0.53047, throughput: 315.19 | 2022-04-11 02:24:10.775 [rank:3] [train], epoch: 10/50, iter: 200/834, loss: 0.36985, lr: 1.382453, top1: 0.52104, throughput: 315.45 | 2022-04-11 02:24:10.778 [rank:4] [train], epoch: 10/50, iter: 200/834, loss: 0.36532, lr: 1.382453, top1: 0.53234, throughput: 315.20 | 2022-04-11 02:24:10.795 [rank:7] [train], epoch: 10/50, iter: 200/834, loss: 0.36879, lr: 1.382453, top1: 0.52458, throughput: 314.90 | 2022-04-11 02:24:10.819 [rank:6] [train], epoch: 10/50, iter: 300/834, loss: 0.36219, lr: 1.378965, top1: 0.53573, throughput: 312.37 | 2022-04-11 02:25:12.241 [rank:5] [train], epoch: 10/50, iter: 300/834, loss: 0.36642, lr: 1.378965, top1: 0.52750, throughput: 312.13 | 2022-04-11 02:25:12.255 [rank:2] [train], epoch: 10/50, iter: 300/834, loss: 0.36529, lr: 1.378965, top1: 0.52927, throughput: 312.06 | 2022-04-11 02:25:12.283 [rank:1] [train], epoch: 10/50, iter: 300/834, loss: 0.36662, lr: 1.378965, top1: 0.52943, throughput: 311.87 | 2022-04-11 02:25:12.298 [rank:4] [train], epoch: 10/50, iter: 300/834, loss: 0.36541, lr: 1.378965, top1: 0.53068, throughput: 312.08 | 2022-04-11 02:25:12.318 [rank:3] [train], epoch: 10/50, iter: 300/834, loss: 0.36211, lr: 1.378965, top1: 0.53443, throughput: 311.96 | 2022-04-11 02:25:12.325 [rank:7] [train], epoch: 10/50, iter: 300/834, loss: 0.36725, lr: 1.378965, top1: 0.52922, throughput: 312.09 | 2022-04-11 02:25:12.339 [rank:0] [train], epoch: 10/50, iter: 300/834, loss: 0.36622, lr: 1.378965, top1: 0.53010, throughput: 311.59 | 2022-04-11 02:25:12.346 [rank:6] [train], epoch: 10/50, iter: 400/834, loss: 0.36443, lr: 1.375441, top1: 0.53062, throughput: 314.01 | 2022-04-11 02:26:13.385 [rank:7] [train], epoch: 10/50, iter: 400/834, loss: 0.36476, lr: 1.375441, top1: 0.53042, throughput: 314.27 | 2022-04-11 02:26:13.433 [rank:2] [train], epoch: 10/50, iter: 400/834, loss: 0.36575, lr: 1.375441, top1: 0.53042, throughput: 313.89 | 2022-04-11 02:26:13.450 [rank:4] [train], epoch: 10/50, iter: 400/834, loss: 0.36667, lr: 1.375441, top1: 0.52729, throughput: 313.90 | 2022-04-11 02:26:13.483 [rank:5] [train], epoch: 10/50, iter: 400/834, loss: 0.36925, lr: 1.375441, top1: 0.52010, throughput: 313.58 | 2022-04-11 02:26:13.484 [rank:0] [train], epoch: 10/50, iter: 400/834, loss: 0.36818, lr: 1.375441, top1: 0.52583, throughput: 313.97 | 2022-04-11 02:26:13.498 [rank:3] [train], epoch: 10/50, iter: 400/834, loss: 0.36428, lr: 1.375441, top1: 0.53130, throughput: 314.25 | 2022-04-11 02:26:13.423 [rank:1] [train], epoch: 10/50, iter: 400/834, loss: 0.36512, lr: 1.375441, top1: 0.52703, throughput: 313.57 | 2022-04-11 02:26:13.528 [rank:5] [train], epoch: 10/50, iter: 500/834, loss: 0.37039, lr: 1.371884, top1: 0.52234, throughput: 311.90 | 2022-04-11 02:27:15.043 [rank:2] [train], epoch: 10/50, iter: 500/834, loss: 0.36615, lr: 1.371884, top1: 0.52964, throughput: 311.57 | 2022-04-11 02:27:15.073 [rank:0] [train], epoch: 10/50, iter: 500/834, loss: 0.36670, lr: 1.371884, top1: 0.52766, throughput: 311.81 | 2022-04-11 02:27:15.074 [rank:1] [train], epoch: 10/50, iter: 500/834, loss: 0.36509, lr: 1.371884, top1: 0.53297, throughput: 311.89 | 2022-04-11 02:27:15.088 [rank:6] [train], epoch: 10/50, iter: 500/834, loss: 0.36609, lr: 1.371884, top1: 0.53224, throughput: 311.16 | 2022-04-11 02:27:15.089 [rank:4] [train], epoch: 10/50, iter: 500/834, loss: 0.36904, lr: 1.371884, top1: 0.52542, throughput: 311.68 | 2022-04-11 02:27:15.086 [rank:3] [train], epoch: 10/50, iter: 500/834, loss: 0.36631, lr: 1.371884, top1: 0.53083, throughput: 311.15 | 2022-04-11 02:27:15.129 [rank:7] [train], epoch: 10/50, iter: 500/834, loss: 0.36968, lr: 1.371884, top1: 0.52365, throughput: 311.16 | 2022-04-11 02:27:15.138 [rank:1] [train], epoch: 10/50, iter: 600/834, loss: 0.36527, lr: 1.368292, top1: 0.52885, throughput: 312.95 | 2022-04-11 02:28:16.439 [rank:4] [train], epoch: 10/50, iter: 600/834, loss: 0.36756, lr: 1.368292, top1: 0.53016, throughput: 312.92 | 2022-04-11 02:28:16.443 [rank:2] [train], epoch: 10/50, iter: 600/834, loss: 0.36823, lr: 1.368292, top1: 0.52750, throughput: 312.85 | 2022-04-11 02:28:16.445 [rank:6] [train], epoch: 10/50, iter: 600/834, loss: 0.36400, lr: 1.368292, top1: 0.53458, throughput: 312.93 | 2022-04-11 02:28:16.445 [rank:5] [train], epoch: 10/50, iter: 600/834, loss: 0.36422, lr: 1.368292, top1: 0.53151, throughput: 312.45 | 2022-04-11 02:28:16.492 [rank:0] [train], epoch: 10/50, iter: 600/834, loss: 0.36695, lr: 1.368292, top1: 0.52615, throughput: 312.60 | 2022-04-11 02:28:16.494 [rank:3] [train], epoch: 10/50, iter: 600/834, loss: 0.36446, lr: 1.368292, top1: 0.53208, throughput: 312.85 | 2022-04-11 02:28:16.500 [rank:7] [train], epoch: 10/50, iter: 600/834, loss: 0.36391, lr: 1.368292, top1: 0.53625, throughput: 312.83 | 2022-04-11 02:28:16.514 [rank:6] [train], epoch: 10/50, iter: 700/834, loss: 0.36941, lr: 1.364666, top1: 0.52333, throughput: 313.78 | 2022-04-11 02:29:17.635 [rank:5] [train], epoch: 10/50, iter: 700/834, loss: 0.36906, lr: 1.364666, top1: 0.52344, throughput: 313.97 | 2022-04-11 02:29:17.644 [rank:1] [train], epoch: 10/50, iter: 700/834, loss: 0.36461, lr: 1.364666, top1: 0.53188, throughput: 313.45 | 2022-04-11 02:29:17.692 [rank:2] [train], epoch: 10/50, iter: 700/834, loss: 0.36356, lr: 1.364666, top1: 0.52979, throughput: 313.42 | 2022-04-11 02:29:17.705 [rank:0] [train], epoch: 10/50, iter: 700/834, loss: 0.36884, lr: 1.364666, top1: 0.51755, throughput: 314.04 | 2022-04-11 02:29:17.633 [rank:4] [train], epoch: 10/50, iter: 700/834, loss: 0.36938, lr: 1.364666, top1: 0.52703, throughput: 313.31 | 2022-04-11 02:29:17.723 [rank:7] [train], epoch: 10/50, iter: 700/834, loss: 0.36765, lr: 1.364666, top1: 0.52844, throughput: 313.58 | 2022-04-11 02:29:17.742 [rank:3] [train], epoch: 10/50, iter: 700/834, loss: 0.36655, lr: 1.364666, top1: 0.52823, throughput: 313.46 | 2022-04-11 02:29:17.752 [rank:6] [train], epoch: 10/50, iter: 800/834, loss: 0.36562, lr: 1.361006, top1: 0.53646, throughput: 311.72 | 2022-04-11 02:30:19.229 [rank:1] [train], epoch: 10/50, iter: 800/834, loss: 0.36667, lr: 1.361006, top1: 0.52641, throughput: 311.96 | 2022-04-11 02:30:19.238 [rank:5] [train], epoch: 10/50, iter: 800/834, loss: 0.36410, lr: 1.361006, top1: 0.52917, throughput: 311.66 | 2022-04-11 02:30:19.249 [rank:4] [train], epoch: 10/50, iter: 800/834, loss: 0.36672, lr: 1.361006, top1: 0.53260, throughput: 312.01 | 2022-04-11 02:30:19.261 [rank:7] [train], epoch: 10/50, iter: 800/834, loss: 0.36627, lr: 1.361006, top1: 0.53156, throughput: 312.09 | 2022-04-11 02:30:19.262 [rank:0] [train], epoch: 10/50, iter: 800/834, loss: 0.36745, lr: 1.361006, top1: 0.52771, throughput: 311.53 | 2022-04-11 02:30:19.264 [rank:2] [train], epoch: 10/50, iter: 800/834, loss: 0.36544, lr: 1.361006, top1: 0.53219, throughput: 311.83 | 2022-04-11 02:30:19.278 [rank:3] [train], epoch: 10/50, iter: 800/834, loss: 0.36568, lr: 1.361006, top1: 0.52901, throughput: 312.00 | 2022-04-11 02:30:19.290 [rank:6] [train], epoch: 10/50, iter: 834/834, loss: 0.36752, lr: 1.359754, top1: 0.52497, throughput: 312.84 | 2022-04-11 02:30:40.096 [rank:4] [train], epoch: 10/50, iter: 834/834, loss: 0.36892, lr: 1.359754, top1: 0.52145, throughput: 312.86 | 2022-04-11 02:30:40.126 [rank:7] [train], epoch: 10/50, iter: 834/834, loss: 0.36417, lr: 1.359754, top1: 0.54090, throughput: 312.80 | 2022-04-11 02:30:40.132 [rank:2] [train], epoch: 10/50, iter: 834/834, loss: 0.36636, lr: 1.359754, top1: 0.52865, throughput: 313.02 | 2022-04-11 02:30:40.133 [rank:1] [train], epoch: 10/50, iter: 834/834, loss: 0.36602, lr: 1.359754, top1: 0.53309, throughput: 312.40 | 2022-04-11 02:30:40.134 [rank:5] [train], epoch: 10/50, iter: 834/834, loss: 0.36399, lr: 1.359754, top1: 0.52773, throughput: 312.51[rank:3] [train], epoch: 10/50, iter: 834/834, loss: 0.36526, lr: 1.359754, top1: 0.52574, throughput: 313.13 | 2022-04-11 02:30:40.138| 2022-04-11 02:30:40.138 [rank:0] [train], epoch: 10/50, iter: 834/834, loss: 0.36792, lr: 1.359754, top1: 0.52405, throughput: 312.61 | 2022-04-11 02:30:40.147 [rank:0] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.53792, throughput: 488.51 | 2022-04-11 02:30:52.941 [rank:4] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.52816, throughput: 487.19 | 2022-04-11 02:30:52.954 [rank:5] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.51664, throughput: 487.60 | 2022-04-11 02:30:52.955 [rank:7] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.52912, throughput: 487.39 | 2022-04-11 02:30:52.956 [rank:2] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.53040, throughput: 487.39 | 2022-04-11 02:30:52.956 [rank:6] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.53248, throughput: 486.00 | 2022-04-11 02:30:52.956 [rank:1] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.54480, throughput: 486.24 | 2022-04-11 02:30:52.988 [rank:3] [eval], epoch: 10/50, iter: 125/125, loss: 0.00000, lr: 1.359754, top1: 0.52128, throughput: 486.21 | 2022-04-11 02:30:52.992 [rank:4] [train], epoch: 11/50, iter: 100/834, loss: 0.36248, lr: 1.356049, top1: 0.53422, throughput: 313.22 | 2022-04-11 02:31:54.254 [rank:0] [train], epoch: 11/50, iter: 100/834, loss: 0.35933, lr: 1.356049, top1: 0.54026, throughput: 312.97 | 2022-04-11 02:31:54.289 [rank:3] [train], epoch: 11/50, iter: 100/834, loss: 0.35941, lr: 1.356049, top1: 0.54307, throughput: 313.22 | 2022-04-11 02:31:54.292 [rank:7] [train], epoch: 11/50, iter: 100/834, loss: 0.35691, lr: 1.356049, top1: 0.54625, throughput: 313.03 | 2022-04-11 02:31:54.292 [rank:1] [train], epoch: 11/50, iter: 100/834, loss: 0.35948, lr: 1.356049, top1: 0.53979, throughput: 313.09 | 2022-04-11 02:31:54.312 [rank:2] [train], epoch: 11/50, iter: 100/834, loss: 0.36327, lr: 1.356049, top1: 0.53479, throughput: 312.82 | 2022-04-11 02:31:54.334 [rank:6] [train], epoch: 11/50, iter: 100/834, loss: 0.35717, lr: 1.356049, top1: 0.54521, throughput: 312.74 | 2022-04-11 02:31:54.349 [rank:5] [train], epoch: 11/50, iter: 100/834, loss: 0.36260, lr: 1.356049, top1: 0.53625, throughput: 312.64 | 2022-04-11 02:31:54.367 [rank:6] [train], epoch: 11/50, iter: 200/834, loss: 0.36434, lr: 1.352311, top1: 0.53151, throughput: 313.25 | 2022-04-11 02:32:55.643 [rank:4] [train], epoch: 11/50, iter: 200/834, loss: 0.36295, lr: 1.352311, top1: 0.53505, throughput: 312.73 | 2022-04-11 02:32:55.648 [rank:7] [train], epoch: 11/50, iter: 200/834, loss: 0.36372, lr: 1.352311, top1: 0.53531, throughput: 312.92 | 2022-04-11 02:32:55.650 [rank:3] [train], epoch: 11/50, iter: 200/834, loss: 0.36040, lr: 1.352311, top1: 0.54115, throughput: 312.73 | 2022-04-11 02:32:55.686 [rank:0] [train], epoch: 11/50, iter: 200/834, loss: 0.36030, lr: 1.352311, top1: 0.54031, throughput: 312.67 | 2022-04-11 02:32:55.696 [rank:5] [train], epoch: 11/50, iter: 200/834, loss: 0.35981, lr: 1.352311, top1: 0.54203, throughput: 313.06 | 2022-04-11 02:32:55.697 [rank:1] [train], epoch: 11/50, iter: 200/834, loss: 0.35963, lr: 1.352311, top1: 0.54089, throughput: 312.73 | 2022-04-11 02:32:55.707 [rank:2] [train], epoch: 11/50, iter: 200/834, loss: 0.35490, lr: 1.352311, top1: 0.55141, throughput: 312.84 | 2022-04-11 02:32:55.708 [rank:7] [train], epoch: 11/50, iter: 300/834, loss: 0.36257, lr: 1.348540, top1: 0.53604, throughput: 311.81 | 2022-04-11 02:33:57.226 [rank:6] [train], epoch: 11/50, iter: 300/834, loss: 0.36051, lr: 1.348540, top1: 0.54172, throughput: 311.69 | 2022-04-11 02:33:57.241 [rank:0] [train], epoch: 11/50, iter: 300/834, loss: 0.36058, lr: 1.348540, top1: 0.53896, throughput: 311.88 | 2022-04-11 02:33:57.258 [rank:2] [train], epoch: 11/50, iter: 300/834, loss: 0.36315, lr: 1.348540, top1: 0.53516, throughput: 311.87 | 2022-04-11 02:33:57.272 [rank:3] [train], epoch: 11/50, iter: 300/834, loss: 0.36095, lr: 1.348540, top1: 0.53630, throughput: 311.69 | 2022-04-11 02:33:57.286 [rank:5] [train], epoch: 11/50, iter: 300/834, loss: 0.35997, lr: 1.348540, top1: 0.53870, throughput: 311.74 | 2022-04-11 02:33:57.287 [rank:1] [train], epoch: 11/50, iter: 300/834, loss: 0.36217, lr: 1.348540, top1: 0.53865, throughput: 311.75 | 2022-04-11 02:33:57.294 [rank:4] [train], epoch: 11/50, iter: 300/834, loss: 0.36182, lr: 1.348540, top1: 0.53635, throughput: 311.39 | 2022-04-11 02:33:57.308 [rank:2] [train], epoch: 11/50, iter: 400/834, loss: 0.36250, lr: 1.344735, top1: 0.53604, throughput: 313.82 | 2022-04-11 02:34:58.453 [rank:7] [train], epoch: 11/50, iter: 400/834, loss: 0.36146, lr: 1.344735, top1: 0.53938, throughput: 313.43 | 2022-04-11 02:34:58.484 [rank:3] [train], epoch: 11/50, iter: 400/834, loss: 0.36451, lr: 1.344735, top1: 0.53073, throughput: 313.65 | 2022-04-11 02:34:58.500 [rank:4] [train], epoch: 11/50, iter: 400/834, loss: 0.36153, lr: 1.344735, top1: 0.53557, throughput: 313.75 | 2022-04-11 02:34:58.502 [rank:1] [train], epoch: 11/50, iter: 400/834, loss: 0.36172, lr: 1.344735, top1: 0.53594, throughput: 313.67 | 2022-04-11 02:34:58.505 [rank:5] [train], epoch: 11/50, iter: 400/834, loss: 0.35990, lr: 1.344735, top1: 0.54177, throughput: 313.63 | 2022-04-11 02:34:58.505 [rank:6] [train], epoch: 11/50, iter: 400/834, loss: 0.36208, lr: 1.344735, top1: 0.53891, throughput: 313.33 | 2022-04-11 02:34:58.518 [rank:0] [train], epoch: 11/50, iter: 400/834, loss: 0.36207, lr: 1.344735, top1: 0.53250, throughput: 313.41 | 2022-04-11 02:34:58.521 [rank:6] [train], epoch: 11/50, iter: 500/834, loss: 0.36001, lr: 1.340898, top1: 0.54245, throughput: 313.92 | 2022-04-11 02:35:59.679 [rank:5] [train], epoch: 11/50, iter: 500/834, loss: 0.36214, lr: 1.340898, top1: 0.53656, throughput: 313.86 | 2022-04-11 02:35:59.680 [rank:1] [train], epoch: 11/50, iter: 500/834, loss: 0.36139, lr: 1.340898, top1: 0.54120, throughput: 313.75 | 2022-04-11 02:35:59.700 [rank:4] [train], epoch: 11/50, iter: 500/834, loss: 0.36258, lr: 1.340898, top1: 0.53698, throughput: 313.68 | 2022-04-11 02:35:59.711 [rank:3] [train], epoch: 11/50, iter: 500/834, loss: 0.36151, lr: 1.340898, top1: 0.53630, throughput: 313.54 | 2022-04-11 02:35:59.737 [rank:7] [train], epoch: 11/50, iter: 500/834, loss: 0.36090, lr: 1.340898, top1: 0.54031, throughput: 313.44 | 2022-04-11 02:35:59.741 [rank:0] [train], epoch: 11/50, iter: 500/834, loss: 0.36319, lr: 1.340898, top1: 0.53339, throughput: 313.98 | 2022-04-11 02:35:59.671 [rank:2] [train], epoch: 11/50, iter: 500/834, loss: 0.36153, lr: 1.340898, top1: 0.53349, throughput: 313.63 | 2022-04-11 02:35:59.672 [rank:5] [train], epoch: 11/50, iter: 600/834, loss: 0.36190, lr: 1.337029, top1: 0.53172, throughput: 313.72 | 2022-04-11 02:37:00.881 [rank:4] [train], epoch: 11/50, iter: 600/834, loss: 0.35911, lr: 1.337029, top1: 0.54380, throughput: 313.87 | 2022-04-11 02:37:00.882 [rank:1] [train], epoch: 11/50, iter: 600/834, loss: 0.36270, lr: 1.337029, top1: 0.53453, throughput: 313.73 | 2022-04-11 02:37:00.900 [rank:7] [train], epoch: 11/50, iter: 600/834, loss: 0.36093, lr: 1.337029, top1: 0.53719, throughput: 313.87 | 2022-04-11 02:37:00.912 [rank:2] [train], epoch: 11/50, iter: 600/834, loss: 0.35918, lr: 1.337029, top1: 0.54031, throughput: 313.50 | 2022-04-11 02:37:00.916 [rank:6] [train], epoch: 11/50, iter: 600/834, loss: 0.36034, lr: 1.337029, top1: 0.53635, throughput: 313.46 | 2022-04-11 02:37:00.931 [rank:3] [train], epoch: 11/50, iter: 600/834, loss: 0.36197, lr: 1.337029, top1: 0.53682, throughput: 313.64 | 2022-04-11 02:37:00.953 [rank:0] [train], epoch: 11/50, iter: 600/834, loss: 0.36071, lr: 1.337029, top1: 0.53880, throughput: 313.30 | 2022-04-11 02:37:00.954 [rank:0] [train], epoch: 11/50, iter: 700/834, loss: 0.36200, lr: 1.333127, top1: 0.53526, throughput: 314.57 | 2022-04-11 02:38:01.990 [rank:6] [train], epoch: 11/50, iter: 700/834, loss: 0.35917, lr: 1.333127, top1: 0.53813, throughput: 314.29 | 2022-04-11 02:38:02.021 [rank:1] [train], epoch: 11/50, iter: 700/834, loss: 0.36173, lr: 1.333127, top1: 0.53719, throughput: 314.09 | 2022-04-11 02:38:02.029 [rank:3] [train], epoch: 11/50, iter: 700/834, loss: 0.35861, lr: 1.333127, top1: 0.54370, throughput: 314.36 | 2022-04-11 02:38:02.029 [rank:4] [train], epoch: 11/50, iter: 700/834, loss: 0.36220, lr: 1.333127, top1: 0.53521, throughput: 313.98 | 2022-04-11 02:38:02.032 [rank:5] [train], epoch: 11/50, iter: 700/834, loss: 0.36168, lr: 1.333127, top1: 0.53917, throughput: 313.92 | 2022-04-11 02:38:02.042 [rank:2] [train], epoch: 11/50, iter: 700/834, loss: 0.36119, lr: 1.333127, top1: 0.53708, throughput: 314.06 | 2022-04-11 02:38:02.050 [rank:7] [train], epoch: 11/50, iter: 700/834, loss: 0.36132, lr: 1.333127, top1: 0.53599, throughput: 314.39 | 2022-04-11 02:38:01.983 [rank:0] [train], epoch: 11/50, iter: 800/834, loss: 0.36122, lr: 1.329193, top1: 0.53578, throughput: 312.61 | 2022-04-11 02:39:03.408 [rank:7] [train], epoch: 11/50, iter: 800/834, loss: 0.36264, lr: 1.329193, top1: 0.53417, throughput: 312.55 | 2022-04-11 02:39:03.412 [rank:6] [train], epoch: 11/50, iter: 800/834, loss: 0.35871, lr: 1.329193, top1: 0.54161, throughput: 312.69 | 2022-04-11 02:39:03.424 [rank:5] [train], epoch: 11/50, iter: 800/834, loss: 0.36005, lr: 1.329193, top1: 0.53771, throughput: 312.79 | 2022-04-11 02:39:03.425 [rank:4] [train], epoch: 11/50, iter: 800/834, loss: 0.35887, lr: 1.329193, top1: 0.53974, throughput: 312.72 | 2022-04-11 02:39:03.428 [rank:3] [train], epoch: 11/50, iter: 800/834, loss: 0.36094, lr: 1.329193, top1: 0.53724, throughput: 312.62 | 2022-04-11 02:39:03.446 [rank:2] [train], epoch: 11/50, iter: 800/834, loss: 0.36234, lr: 1.329193, top1: 0.53969, throughput: 312.72 | 2022-04-11 02:39:03.447 [rank:1] [train], epoch: 11/50, iter: 800/834, loss: 0.36210, lr: 1.329193, top1: 0.53422, throughput: 312.53 | 2022-04-11 02:39:03.463 [rank:5] [train], epoch: 11/50, iter: 834/834, loss: 0.36463, lr: 1.327848, top1: 0.52941, throughput: 311.43 | 2022-04-11 02:39:24.386 [rank:6] [train], epoch: 11/50, iter: 834/834, loss: 0.36223, lr: 1.327848, top1: 0.53202, throughput: 311.23 | 2022-04-11 02:39:24.399 [rank:3] [train], epoch: 11/50, iter: 834/834, loss: 0.35875, lr: 1.327848, top1: 0.53937, throughput: 311.53 | 2022-04-11 02:39:24.400 [rank:2] [train], epoch: 11/50, iter: 834/834, loss: 0.36224, lr: 1.327848, top1: 0.53937, throughput: 311.49 | 2022-04-11 02:39:24.404 [rank:4] [train], epoch: 11/50, iter: 834/834, loss: 0.36117, lr: 1.327848, top1: 0.54565, throughput: 311.05 | 2022-04-11 02:39:24.415 [rank:7] [train], epoch: 11/50, iter: 834/834, loss: 0.35974, lr: 1.327848, top1: 0.53493, throughput: 310.74 | 2022-04-11 02:39:24.420 [rank:0] [train], epoch: 11/50, iter: 834/834, loss: 0.35834, lr: 1.327848, top1: 0.53937, throughput: 310.55 | 2022-04-11 02:39:24.428 [rank:1] [train], epoch: 11/50, iter: 834/834, loss: 0.35756, lr: 1.327848, top1: 0.54197, throughput: 310.93 | 2022-04-11 02:39:24.459 [rank:0] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.55872, throughput: 483.73 | 2022-04-11 02:39:37.349 [rank:4] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.54432, throughput: 483.04 | 2022-04-11 02:39:37.354 [rank:5] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.53456, throughput: 481.47 | 2022-04-11 02:39:37.367 [rank:7] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.54448, throughput: 482.66 | 2022-04-11 02:39:37.369 [rank:2] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.53840, throughput: 481.76 | 2022-04-11 02:39:37.377 [rank:6] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.54768, throughput: 481.57 | 2022-04-11 02:39:37.377 [rank:3] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.54080, throughput: 481.24 | 2022-04-11 02:39:37.388 [rank:1] [eval], epoch: 11/50, iter: 125/125, loss: 0.00000, lr: 1.327848, top1: 0.54976, throughput: 482.74 | 2022-04-11 02:39:37.406 [rank:7] [train], epoch: 12/50, iter: 100/834, loss: 0.35621, lr: 1.323871, top1: 0.55010, throughput: 311.50 | 2022-04-11 02:40:39.008 [rank:4] [train], epoch: 12/50, iter: 100/834, loss: 0.35739, lr: 1.323871, top1: 0.54453, throughput: 311.37 | 2022-04-11 02:40:39.017 [rank:6] [train], epoch: 12/50, iter: 100/834, loss: 0.35602, lr: 1.323871, top1: 0.54599, throughput: 311.47 | 2022-04-11 02:40:39.021 [rank:5] [train], epoch: 12/50, iter: 100/834, loss: 0.35388, lr: 1.323871, top1: 0.55229, throughput: 311.31 | 2022-04-11 02:40:39.041 [rank:0] [train], epoch: 12/50, iter: 100/834, loss: 0.35640, lr: 1.323871, top1: 0.54255, throughput: 311.13 | 2022-04-11 02:40:39.060 [rank:3] [train], epoch: 12/50, iter: 100/834, loss: 0.35581, lr: 1.323871, top1: 0.54458, throughput: 311.32 | 2022-04-11 02:40:39.062 [rank:2] [train], epoch: 12/50, iter: 100/834, loss: 0.35539, lr: 1.323871, top1: 0.54688, throughput: 311.23 | 2022-04-11 02:40:39.068 [rank:1] [train], epoch: 12/50, iter: 100/834, loss: 0.35420, lr: 1.323871, top1: 0.54943, throughput: 311.36 | 2022-04-11 02:40:39.071 [rank:4] [train], epoch: 12/50, iter: 200/834, loss: 0.35528, lr: 1.319863, top1: 0.54714, throughput: 313.51 | 2022-04-11 02:41:40.259 [rank:1] [train], epoch: 12/50, iter: 200/834, loss: 0.35634, lr: 1.319863, top1: 0.54859, throughput: 313.66 | 2022-04-11 02:41:40.284 [rank:6] [train], epoch: 12/50, iter: 200/834, loss: 0.35826, lr: 1.319863, top1: 0.54359, throughput: 313.39 | 2022-04-11 02:41:40.286 [rank:5] [train], epoch: 12/50, iter: 200/834, loss: 0.35937, lr: 1.319863, top1: 0.53516, throughput: 313.33 | 2022-04-11 02:41:40.319 [rank:2] [train], epoch: 12/50, iter: 200/834, loss: 0.35549, lr: 1.319863, top1: 0.54505, throughput: 313.42 | 2022-04-11 02:41:40.329 [rank:0] [train], epoch: 12/50, iter: 200/834, loss: 0.35282, lr: 1.319863, top1: 0.55714, throughput: 313.37 | 2022-04-11 02:41:40.329 [rank:7] [train], epoch: 12/50, iter: 200/834, loss: 0.35512, lr: 1.319863, top1: 0.54823, throughput: 313.07 | 2022-04-11 02:41:40.335 [rank:3] [train], epoch: 12/50, iter: 200/834, loss: 0.35700, lr: 1.319863, top1: 0.54641, throughput: 313.31 | 2022-04-11 02:41:40.344 [rank:1] [train], epoch: 12/50, iter: 300/834, loss: 0.35862, lr: 1.315824, top1: 0.54490, throughput: 313.02 | 2022-04-11 02:42:41.622 [rank:7] [train], epoch: 12/50, iter: 300/834, loss: 0.35870, lr: 1.315824, top1: 0.53859, throughput: 313.03 | 2022-04-11 02:42:41.670 [rank:0] [train], epoch: 12/50, iter: 300/834, loss: 0.35453, lr: 1.315824, top1: 0.54734, throughput: 312.93 | 2022-04-11 02:42:41.685 [rank:2] [train], epoch: 12/50, iter: 300/834, loss: 0.35694, lr: 1.315824, top1: 0.54750, throughput: 312.80 | 2022-04-11 02:42:41.710 [rank:3] [train], epoch: 12/50, iter: 300/834, loss: 0.35895, lr: 1.315824, top1: 0.54151, throughput: 312.82 | 2022-04-11 02:42:41.721 [rank:6] [train], epoch: 12/50, iter: 300/834, loss: 0.35582, lr: 1.315824, top1: 0.54854, throughput: 312.53 | 2022-04-11 02:42:41.720 [rank:5] [train], epoch: 12/50, iter: 300/834, loss: 0.35709, lr: 1.315824, top1: 0.54510, throughput: 312.65 | 2022-04-11 02:42:41.729 [rank:4] [train], epoch: 12/50, iter: 300/834, loss: 0.36035, lr: 1.315824, top1: 0.53781, throughput: 312.24 | 2022-04-11 02:42:41.750 [rank:6] [train], epoch: 12/50, iter: 400/834, loss: 0.35665, lr: 1.311753, top1: 0.54630, throughput: 314.26 | 2022-04-11 02:43:42.817 [rank:5] [train], epoch: 12/50, iter: 400/834, loss: 0.35347, lr: 1.311753, top1: 0.55271, throughput: 314.24 | 2022-04-11 02:43:42.830 [rank:1] [train], epoch: 12/50, iter: 400/834, loss: 0.35544, lr: 1.311753, top1: 0.54828, throughput: 313.68 | 2022-04-11 02:43:42.832 [rank:4] [train], epoch: 12/50, iter: 400/834, loss: 0.35452, lr: 1.311753, top1: 0.54750, throughput: 314.33 | 2022-04-11 02:43:42.833 [rank:2] [train], epoch: 12/50, iter: 400/834, loss: 0.35879, lr: 1.311753, top1: 0.54260, throughput: 313.95 | 2022-04-11 02:43:42.866 [rank:3] [train], epoch: 12/50, iter: 400/834, loss: 0.35493, lr: 1.311753, top1: 0.55531, throughput: 313.88 | 2022-04-11 02:43:42.891 [rank:7] [train], epoch: 12/50, iter: 400/834, loss: 0.35654, lr: 1.311753, top1: 0.54661, throughput: 313.58 | 2022-04-11 02:43:42.898 [rank:0] [train], epoch: 12/50, iter: 400/834, loss: 0.35505, lr: 1.311753, top1: 0.54693, throughput: 314.04 | 2022-04-11 02:43:42.825 [rank:1] [train], epoch: 12/50, iter: 500/834, loss: 0.35675, lr: 1.307652, top1: 0.54552, throughput: 312.34 | 2022-04-11 02:44:44.304 [rank:6] [train], epoch: 12/50, iter: 500/834, loss: 0.35726, lr: 1.307652, top1: 0.54505, throughput: 312.24 | 2022-04-11 02:44:44.308 [rank:2] [train], epoch: 12/50, iter: 500/834, loss: 0.35428, lr: 1.307652, top1: 0.55104, throughput: 312.37 | 2022-04-11 02:44:44.331 [rank:7] [train], epoch: 12/50, iter: 500/834, loss: 0.35503, lr: 1.307652, top1: 0.55021, throughput: 312.46 | 2022-04-11 02:44:44.346 [rank:5] [train], epoch: 12/50, iter: 500/834, loss: 0.35613, lr: 1.307652, top1: 0.54542, throughput: 312.11 | 2022-04-11 02:44:44.347 [rank:0] [train], epoch: 12/50, iter: 500/834, loss: 0.35501, lr: 1.307652, top1: 0.54641, throughput: 312.08 | 2022-04-11 02:44:44.348 [rank:3] [train], epoch: 12/50, iter: 500/834, loss: 0.35897, lr: 1.307652, top1: 0.53849, throughput: 312.31 | 2022-04-11 02:44:44.368 [rank:4] [train], epoch: 12/50, iter: 500/834, loss: 0.35716, lr: 1.307652, top1: 0.54604, throughput: 312.40 | 2022-04-11 02:44:44.293 [rank:6] [train], epoch: 12/50, iter: 600/834, loss: 0.35727, lr: 1.303520, top1: 0.54380, throughput: 311.75 | 2022-04-11 02:45:45.896 [rank:7] [train], epoch: 12/50, iter: 600/834, loss: 0.35645, lr: 1.303520, top1: 0.54401, throughput: 311.88 | 2022-04-11 02:45:45.907 [rank:4] [train], epoch: 12/50, iter: 600/834, loss: 0.35726, lr: 1.303520, top1: 0.53964, throughput: 311.58 | 2022-04-11 02:45:45.915 [rank:5] [train], epoch: 12/50, iter: 600/834, loss: 0.35752, lr: 1.303520, top1: 0.54516, throughput: 311.85 | 2022-04-11 02:45:45.914 [rank:1] [train], epoch: 12/50, iter: 600/834, loss: 0.35901, lr: 1.303520, top1: 0.54266, throughput: 311.56 | 2022-04-11 02:45:45.930 [rank:3] [train], epoch: 12/50, iter: 600/834, loss: 0.35608, lr: 1.303520, top1: 0.54719, throughput: 311.83 | 2022-04-11 02:45:45.940 [rank:0] [train], epoch: 12/50, iter: 600/834, loss: 0.35823, lr: 1.303520, top1: 0.54208, throughput: 311.71 | 2022-04-11 02:45:45.944 [rank:2] [train], epoch: 12/50, iter: 600/834, loss: 0.35640, lr: 1.303520, top1: 0.54599, throughput: 311.49 | 2022-04-11 02:45:45.971 [rank:4] [train], epoch: 12/50, iter: 700/834, loss: 0.35947, lr: 1.299357, top1: 0.53693, throughput: 311.35 | 2022-04-11 02:46:47.582 [rank:1] [train], epoch: 12/50, iter: 700/834, loss: 0.35693, lr: 1.299357, top1: 0.54318, throughput: 311.41 | 2022-04-11 02:46:47.584 [rank:7] [train], epoch: 12/50, iter: 700/834, loss: 0.35611, lr: 1.299357, top1: 0.54865, throughput: 311.24 | 2022-04-11 02:46:47.596 [rank:6] [train], epoch: 12/50, iter: 700/834, loss: 0.35811, lr: 1.299357, top1: 0.53818, throughput: 311.08 | 2022-04-11 02:46:47.616 [rank:5] [train], epoch: 12/50, iter: 700/834, loss: 0.35724, lr: 1.299357, top1: 0.54490, throughput: 311.07 | 2022-04-11 02:46:47.636 [rank:2] [train], epoch: 12/50, iter: 700/834, loss: 0.35630, lr: 1.299357, top1: 0.54396, throughput: 311.35 | 2022-04-11 02:46:47.637 [rank:0] [train], epoch: 12/50, iter: 700/834, loss: 0.35583, lr: 1.299357, top1: 0.55026, throughput: 311.12 | 2022-04-11 02:46:47.657 [rank:3] [train], epoch: 12/50, iter: 700/834, loss: 0.35914, lr: 1.299357, top1: 0.54302, throughput: 311.05 | 2022-04-11 02:46:47.667 [rank:6] [train], epoch: 12/50, iter: 800/834, loss: 0.35812, lr: 1.295164, top1: 0.54167, throughput: 313.71 | 2022-04-11 02:47:48.819 [rank:0] [train], epoch: 12/50, iter: 800/834, loss: 0.35891, lr: 1.295164, top1: 0.53719, throughput: 313.91 | 2022-04-11 02:47:48.821 [rank:7] [train], epoch: 12/50, iter: 800/834, loss: 0.35737, lr: 1.295164, top1: 0.54438, throughput: 313.51 | 2022-04-11 02:47:48.838 [rank:3] [train], epoch: 12/50, iter: 800/834, loss: 0.35960, lr: 1.295164, top1: 0.54172, throughput: 313.83 | 2022-04-11 02:47:48.847 [rank:5] [train], epoch: 12/50, iter: 800/834, loss: 0.35629, lr: 1.295164, top1: 0.54807, throughput: 313.62 | 2022-04-11 02:47:48.857 [rank:4] [train], epoch: 12/50, iter: 800/834, loss: 0.35500, lr: 1.295164, top1: 0.54661, throughput: 313.32 | 2022-04-11 02:47:48.862 [rank:1] [train], epoch: 12/50, iter: 800/834, loss: 0.35530, lr: 1.295164, top1: 0.54943, throughput: 313.27 | 2022-04-11 02:47:48.873 [rank:2] [train], epoch: 12/50, iter: 800/834, loss: 0.35905, lr: 1.295164, top1: 0.54385, throughput: 313.50 | 2022-04-11 02:47:48.881 [rank:4] [train], epoch: 12/50, iter: 834/834, loss: 0.35866, lr: 1.293732, top1: 0.54243, throughput: 314.81 | 2022-04-11 02:48:09.598 [rank:5] [train], epoch: 12/50, iter: 834/834, loss: 0.35501, lr: 1.293732, top1: 0.53968, throughput: 314.56 | 2022-04-11 02:48:09.610 [rank:1] [train], epoch: 12/50, iter: 834/834, loss: 0.35599, lr: 1.293732, top1: 0.54596, throughput: 314.78 | 2022-04-11 02:48:09.611 [rank:6] [train], epoch: 12/50, iter: 834/834, loss: 0.35732, lr: 1.293732, top1: 0.54795, throughput: 313.97 | 2022-04-11 02:48:09.611 [rank:2] [train], epoch: 12/50, iter: 834/834, loss: 0.36136, lr: 1.293732, top1: 0.53600, throughput: 314.90 | 2022-04-11 02:48:09.611 [rank:0] [train], epoch: 12/50, iter: 834/834, loss: 0.35729, lr: 1.293732, top1: 0.55025, throughput: 313.88 | 2022-04-11 02:48:09.619 [rank:3] [train], epoch: 12/50, iter: 834/834, loss: 0.35598, lr: 1.293732, top1: 0.55178, throughput: 314.06 | 2022-04-11 02:48:09.632 [rank:7] [train], epoch: 12/50, iter: 834/834, loss: 0.35244, lr: 1.293732, top1: 0.55898, throughput: 313.90 | 2022-04-11 02:48:09.635 [rank:0] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.55968, throughput: 485.65 | 2022-04-11 02:48:22.489 [rank:4] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.54560, throughput: 484.59 | 2022-04-11 02:48:22.495 [rank:2] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.55392, throughput: 484.97 | 2022-04-11 02:48:22.499 [rank:7] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.55216, throughput: 485.31 | 2022-04-11 02:48:22.513 [rank:6] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.55200, throughput: 484.34 | 2022-04-11 02:48:22.515 [rank:5] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.54448, throughput: 484.30 | 2022-04-11 02:48:22.515 [rank:3] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.54608, throughput: 485.10 | 2022-04-11 02:48:22.516 [rank:1] [eval], epoch: 12/50, iter: 125/125, loss: 0.00000, lr: 1.293732, top1: 0.55392, throughput: 483.75 | 2022-04-11 02:48:22.531 [rank:2] [train], epoch: 13/50, iter: 100/834, loss: 0.35339, lr: 1.289500, top1: 0.55245, throughput: 314.29 | 2022-04-11 02:49:23.590 [rank:5] [train], epoch: 13/50, iter: 100/834, loss: 0.35331, lr: 1.289500, top1: 0.55276, throughput: 314.32 | 2022-04-11 02:49:23.599 [rank:4] [train], epoch: 13/50, iter: 100/834, loss: 0.34853, lr: 1.289500, top1: 0.56292, throughput: 314.12 | 2022-04-11 02:49:23.618 [rank:1] [train], epoch: 13/50, iter: 100/834, loss: 0.34795, lr: 1.289500, top1: 0.56240, throughput: 314.27 | 2022-04-11 02:49:23.624 [rank:0] [train], epoch: 13/50, iter: 100/834, loss: 0.35191, lr: 1.289500, top1: 0.55328, throughput: 314.05 | 2022-04-11 02:49:23.626 [rank:3] [train], epoch: 13/50, iter: 100/834, loss: 0.34923, lr: 1.289500, top1: 0.55979, throughput: 314.16 | 2022-04-11 02:49:23.632 [rank:6] [train], epoch: 13/50, iter: 100/834, loss: 0.35211, lr: 1.289500, top1: 0.55010, throughput: 313.98 | 2022-04-11 02:49:23.665 [rank:7] [train], epoch: 13/50, iter: 100/834, loss: 0.34741, lr: 1.289500, top1: 0.56453, throughput: 313.84 | 2022-04-11 02:49:23.691 [rank:0] [train], epoch: 13/50, iter: 200/834, loss: 0.35644, lr: 1.285237, top1: 0.54427, throughput: 313.70 | 2022-04-11 02:50:24.831 [rank:7] [train], epoch: 13/50, iter: 200/834, loss: 0.35132, lr: 1.285237, top1: 0.55734, throughput: 314.01 | 2022-04-11 02:50:24.835 [rank:4] [train], epoch: 13/50, iter: 200/834, loss: 0.35094, lr: 1.285237, top1: 0.54990, throughput: 313.62[rank:2] [train], epoch: 13/50, iter: 200/834, loss: 0.35325, lr: 1.285237, top1: 0.55234, throughput: 313.48 | 2022-04-11 02:50:24.838 | 2022-04-11 02:50:24.838 [rank:3] [train], epoch: 13/50, iter: 200/834, loss: 0.35448, lr: 1.285237, top1: 0.54630, throughput: 313.65 | 2022-04-11 02:50:24.847 [rank:6] [train], epoch: 13/50, iter: 200/834, loss: 0.35141, lr: 1.285237, top1: 0.55375, throughput: 313.81 | 2022-04-11 02:50:24.849 [rank:5] [train], epoch: 13/50, iter: 200/834, loss: 0.35293, lr: 1.285237, top1: 0.55271, throughput: 313.81 | 2022-04-11 02:50:24.784 [rank:1] [train], epoch: 13/50, iter: 200/834, loss: 0.34992, lr: 1.285237, top1: 0.56490, throughput: 313.38 | 2022-04-11 02:50:24.891 [rank:1] [train], epoch: 13/50, iter: 300/834, loss: 0.35500, lr: 1.280946, top1: 0.55000, throughput: 314.71 | 2022-04-11 02:51:25.899 [rank:7] [train], epoch: 13/50, iter: 300/834, loss: 0.35100, lr: 1.280946, top1: 0.55724, throughput: 314.31 | 2022-04-11 02:51:25.922 [rank:0] [train], epoch: 13/50, iter: 300/834, loss: 0.35351, lr: 1.280946, top1: 0.54755, throughput: 314.24 | 2022-04-11 02:51:25.930 [rank:5] [train], epoch: 13/50, iter: 300/834, loss: 0.35161, lr: 1.280946, top1: 0.55740, throughput: 313.95 | 2022-04-11 02:51:25.941 [rank:6] [train], epoch: 13/50, iter: 300/834, loss: 0.35238, lr: 1.280946, top1: 0.55396, throughput: 314.27 | 2022-04-11 02:51:25.943 [rank:4] [train], epoch: 13/50, iter: 300/834, loss: 0.35131, lr: 1.280946, top1: 0.55760, throughput: 314.17 | 2022-04-11 02:51:25.953 [rank:3] [train], epoch: 13/50, iter: 300/834, loss: 0.35342, lr: 1.280946, top1: 0.54849, throughput: 314.55 | 2022-04-11 02:51:25.887 [rank:2] [train], epoch: 13/50, iter: 300/834, loss: 0.35472, lr: 1.280946, top1: 0.54714, throughput: 314.44 | 2022-04-11 02:51:25.898 [rank:6] [train], epoch: 13/50, iter: 400/834, loss: 0.35633, lr: 1.276625, top1: 0.54797, throughput: 313.65 | 2022-04-11 02:52:27.157 [rank:3] [train], epoch: 13/50, iter: 400/834, loss: 0.35250, lr: 1.276625, top1: 0.55313, throughput: 313.36 | 2022-04-11 02:52:27.157 [rank:0] [train], epoch: 13/50, iter: 400/834, loss: 0.35377, lr: 1.276625, top1: 0.55365, throughput: 313.52 | 2022-04-11 02:52:27.170 [rank:7] [train], epoch: 13/50, iter: 400/834, loss: 0.35297, lr: 1.276625, top1: 0.55146, throughput: 313.46 | 2022-04-11 02:52:27.173 [rank:1] [train], epoch: 13/50, iter: 400/834, loss: 0.35605, lr: 1.276625, top1: 0.54797, throughput: 313.30 | 2022-04-11 02:52:27.182 [rank:5] [train], epoch: 13/50, iter: 400/834, loss: 0.35086, lr: 1.276625, top1: 0.55729, throughput: 313.41 | 2022-04-11 02:52:27.203 [rank:4] [train], epoch: 13/50, iter: 400/834, loss: 0.35574, lr: 1.276625, top1: 0.54844, throughput: 313.43 | 2022-04-11 02:52:27.210 [rank:2] [train], epoch: 13/50, iter: 400/834, loss: 0.35350, lr: 1.276625, top1: 0.55115, throughput: 313.01 | 2022-04-11 02:52:27.239 [rank:4] [train], epoch: 13/50, iter: 500/834, loss: 0.35440, lr: 1.272275, top1: 0.54422, throughput: 314.14 | 2022-04-11 02:53:28.328 [rank:5] [train], epoch: 13/50, iter: 500/834, loss: 0.35181, lr: 1.272275, top1: 0.55474, throughput: 314.08 | 2022-04-11 02:53:28.334 [rank:0] [train], epoch: 13/50, iter: 500/834, loss: 0.35614, lr: 1.272275, top1: 0.54729, throughput: 313.81 | 2022-04-11 02:53:28.354 [rank:1] [train], epoch: 13/50, iter: 500/834, loss: 0.35438, lr: 1.272275, top1: 0.55109, throughput: 313.78 | 2022-04-11 02:53:28.371 [rank:7] [train], epoch: 13/50, iter: 500/834, loss: 0.35444, lr: 1.272275, top1: 0.54880, throughput: 313.67 | 2022-04-11 02:53:28.384 [rank:6] [train], epoch: 13/50, iter: 500/834, loss: 0.35129, lr: 1.272275, top1: 0.55516, throughput: 313.58 | 2022-04-11 02:53:28.385 [rank:2] [train], epoch: 13/50, iter: 500/834, loss: 0.35131, lr: 1.272275, top1: 0.55755, throughput: 313.95 | 2022-04-11 02:53:28.396 [rank:3] [train], epoch: 13/50, iter: 500/834, loss: 0.35055, lr: 1.272275, top1: 0.55661, throughput: 313.92 | 2022-04-11 02:53:28.320 [rank:2] [train], epoch: 13/50, iter: 600/834, loss: 0.35095, lr: 1.267897, top1: 0.55422, throughput: 314.31 | 2022-04-11 02:54:29.482 [rank:1] [train], epoch: 13/50, iter: 600/834, loss: 0.35174, lr: 1.267897, top1: 0.55557, throughput: 314.04 | 2022-04-11 02:54:29.510 [rank:3] [train], epoch: 13/50, iter: 600/834, loss: 0.35588, lr: 1.267897, top1: 0.54948, throughput: 313.74 | 2022-04-11 02:54:29.517 [rank:5] [train], epoch: 13/50, iter: 600/834, loss: 0.35161, lr: 1.267897, top1: 0.55703, throughput: 313.76 | 2022-04-11 02:54:29.526 [rank:7] [train], epoch: 13/50, iter: 600/834, loss: 0.35215, lr: 1.267897, top1: 0.55672, throughput: 314.01 | 2022-04-11 02:54:29.529 [rank:6] [train], epoch: 13/50, iter: 600/834, loss: 0.35265, lr: 1.267897, top1: 0.55411, throughput: 313.94 | 2022-04-11 02:54:29.543 [rank:4] [train], epoch: 13/50, iter: 600/834, loss: 0.35128, lr: 1.267897, top1: 0.55156, throughput: 313.58 | 2022-04-11 02:54:29.556 [rank:0] [train], epoch: 13/50, iter: 600/834, loss: 0.35246, lr: 1.267897, top1: 0.55229, throughput: 313.53 | 2022-04-11 02:54:29.592 [rank:7] [train], epoch: 13/50, iter: 700/834, loss: 0.35171, lr: 1.263491, top1: 0.55411, throughput: 311.01 | 2022-04-11 02:55:31.263 [rank:0] [train], epoch: 13/50, iter: 700/834, loss: 0.35454, lr: 1.263491, top1: 0.55057, throughput: 311.21 | 2022-04-11 02:55:31.288 [rank:5] [train], epoch: 13/50, iter: 700/834, loss: 0.35417, lr: 1.263491, top1: 0.54740, throughput: 310.86 | 2022-04-11 02:55:31.290 [rank:2] [train], epoch: 13/50, iter: 700/834, loss: 0.35185, lr: 1.263491, top1: 0.55464, throughput: 310.62 | 2022-04-11 02:55:31.294 [rank:3] [train], epoch: 13/50, iter: 700/834, loss: 0.35273, lr: 1.263491, top1: 0.55521, throughput: 310.75 | 2022-04-11 02:55:31.303 [rank:6] [train], epoch: 13/50, iter: 700/834, loss: 0.35363, lr: 1.263491, top1: 0.55313, throughput: 310.86 | 2022-04-11 02:55:31.307 [rank:4] [train], epoch: 13/50, iter: 700/834, loss: 0.35324, lr: 1.263491, top1: 0.55120, throughput: 310.89 | 2022-04-11 02:55:31.315 [rank:1] [train], epoch: 13/50, iter: 700/834, loss: 0.35093, lr: 1.263491, top1: 0.55557, throughput: 310.56 | 2022-04-11 02:55:31.333 [rank:5] [train], epoch: 13/50, iter: 800/834, loss: 0.35167, lr: 1.259056, top1: 0.55208, throughput: 311.83 | 2022-04-11 02:56:32.863 [rank:7] [train], epoch: 13/50, iter: 800/834, loss: 0.35305, lr: 1.259056, top1: 0.55224, throughput: 311.41 | 2022-04-11 02:56:32.918 [rank:6] [train], epoch: 13/50, iter: 800/834, loss: 0.35549, lr: 1.259056, top1: 0.54958, throughput: 311.46 | 2022-04-11 02:56:32.952 [rank:3] [train], epoch: 13/50, iter: 800/834, loss: 0.35461, lr: 1.259056, top1: 0.55005, throughput: 311.44 | 2022-04-11 02:56:32.953 [rank:1] [train], epoch: 13/50, iter: 800/834, loss: 0.35466, lr: 1.259056, top1: 0.55141, throughput: 311.76 | 2022-04-11 02:56:32.920 [rank:4] [train], epoch: 13/50, iter: 800/834, loss: 0.35712, lr: 1.259056, top1: 0.54448, throughput: 311.23 | 2022-04-11 02:56:33.007 [rank:0] [train], epoch: 13/50, iter: 800/834, loss: 0.35544, lr: 1.259056, top1: 0.54990, throughput: 311.00 | 2022-04-11 02:56:33.023 [rank:2] [train], epoch: 13/50, iter: 800/834, loss: 0.35321, lr: 1.259056, top1: 0.55516, throughput: 310.98 | 2022-04-11 02:56:33.034 [rank:5] [train], epoch: 13/50, iter: 834/834, loss: 0.35114, lr: 1.257542, top1: 0.55407, throughput: 311.64 | 2022-04-11 02:56:53.810 [rank:6] [train], epoch: 13/50, iter: 834/834, loss: 0.34804, lr: 1.257542, top1: 0.56602, throughput: 312.70 | 2022-04-11 02:56:53.829 [rank:7] [train], epoch: 13/50, iter: 834/834, loss: 0.35055, lr: 1.257542, top1: 0.55423, throughput: 312.10 | 2022-04-11 02:56:53.834 [rank:1] [train], epoch: 13/50, iter: 834/834, loss: 0.35819, lr: 1.257542, top1: 0.53263, throughput: 312.03 | 2022-04-11 02:56:53.841 [rank:4] [train], epoch: 13/50, iter: 834/834, loss: 0.34850, lr: 1.257542, top1: 0.55959, throughput: 313.27 | 2022-04-11 02:56:53.845 [rank:0] [train], epoch: 13/50, iter: 834/834, loss: 0.35227, lr: 1.257542, top1: 0.55193, throughput: 313.44 | 2022-04-11 02:56:53.850 [rank:3] [train], epoch: 13/50, iter: 834/834, loss: 0.35352, lr: 1.257542, top1: 0.55790, throughput: 312.24 | 2022-04-11 02:56:53.860 [rank:2] [train], epoch: 13/50, iter: 834/834, loss: 0.35444, lr: 1.257542, top1: 0.54887, throughput: 313.43 | 2022-04-11 02:56:53.861 [rank:0] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.56048, throughput: 489.44 | 2022-04-11 02:57:06.620 [rank:7] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.56096, throughput: 488.47 | 2022-04-11 02:57:06.629 [rank:4] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.55104, throughput: 488.86 | 2022-04-11 02:57:06.630 [rank:2] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.54224, throughput: 489.22 | 2022-04-11 02:57:06.637 [rank:6] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.55872, throughput: 487.91 | 2022-04-11 02:57:06.638 [rank:5] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.54384, throughput: 487.19 | 2022-04-11 02:57:06.639 [rank:3] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.54640, throughput: 488.73 | 2022-04-11 02:57:06.648 [rank:1] [eval], epoch: 13/50, iter: 125/125, loss: 0.00000, lr: 1.257542, top1: 0.55792, throughput: 486.99 | 2022-04-11 02:57:06.675 [rank:4] [train], epoch: 14/50, iter: 100/834, loss: 0.34567, lr: 1.253070, top1: 0.56578, throughput: 315.18 | 2022-04-11 02:58:07.547 [rank:6] [train], epoch: 14/50, iter: 100/834, loss: 0.34639, lr: 1.253070, top1: 0.56214, throughput: 315.09 | 2022-04-11 02:58:07.574 [rank:7] [train], epoch: 14/50, iter: 100/834, loss: 0.34771, lr: 1.253070, top1: 0.56411, throughput: 314.94 | 2022-04-11 02:58:07.593 [rank:5] [train], epoch: 14/50, iter: 100/834, loss: 0.34375, lr: 1.253070, top1: 0.56984, throughput: 314.94 | 2022-04-11 02:58:07.603 [rank:0] [train], epoch: 14/50, iter: 100/834, loss: 0.34679, lr: 1.253070, top1: 0.56354, throughput: 314.79 | 2022-04-11 02:58:07.613 [rank:1] [train], epoch: 14/50, iter: 100/834, loss: 0.34866, lr: 1.253070, top1: 0.56234, throughput: 315.01 | 2022-04-11 02:58:07.625 [rank:2] [train], epoch: 14/50, iter: 100/834, loss: 0.34880, lr: 1.253070, top1: 0.55875, throughput: 314.75 | 2022-04-11 02:58:07.638 [rank:3] [train], epoch: 14/50, iter: 100/834, loss: 0.34858, lr: 1.253070, top1: 0.56260, throughput: 315.18 | 2022-04-11 02:58:07.565 [rank:7] [train], epoch: 14/50, iter: 200/834, loss: 0.35014, lr: 1.248570, top1: 0.55859, throughput: 312.85 | 2022-04-11 02:59:08.965 [rank:4] [train], epoch: 14/50, iter: 200/834, loss: 0.34896, lr: 1.248570, top1: 0.56125, throughput: 312.55 | 2022-04-11 02:59:08.976 [rank:3] [train], epoch: 14/50, iter: 200/834, loss: 0.34847, lr: 1.248570, top1: 0.56068, throughput: 312.65 | 2022-04-11 02:59:08.976 [rank:1] [train], epoch: 14/50, iter: 200/834, loss: 0.34765, lr: 1.248570, top1: 0.56313, throughput: 312.93 | 2022-04-11 02:59:08.980 [rank:0] [train], epoch: 14/50, iter: 200/834, loss: 0.34807, lr: 1.248570, top1: 0.55995, throughput: 312.80 | 2022-04-11 02:59:08.993 [rank:5] [train], epoch: 14/50, iter: 200/834, loss: 0.34726, lr: 1.248570, top1: 0.56281, throughput: 312.68 | 2022-04-11 02:59:09.008 [rank:2] [train], epoch: 14/50, iter: 200/834, loss: 0.35040, lr: 1.248570, top1: 0.55953, throughput: 312.84 | 2022-04-11 02:59:09.010 [rank:6] [train], epoch: 14/50, iter: 200/834, loss: 0.34824, lr: 1.248570, top1: 0.55995, throughput: 312.78 | 2022-04-11 02:59:08.959 [rank:3] [train], epoch: 14/50, iter: 300/834, loss: 0.35128, lr: 1.244043, top1: 0.55516, throughput: 313.50 | 2022-04-11 03:00:10.220 [rank:1] [train], epoch: 14/50, iter: 300/834, loss: 0.34629, lr: 1.244043, top1: 0.56740, throughput: 313.41 | 2022-04-11 03:00:10.242 [rank:0] [train], epoch: 14/50, iter: 300/834, loss: 0.35039, lr: 1.244043, top1: 0.55604, throughput: 313.42 | 2022-04-11 03:00:10.253 [rank:6] [train], epoch: 14/50, iter: 300/834, loss: 0.34744, lr: 1.244043, top1: 0.55703, throughput: 313.19 | 2022-04-11 03:00:10.264 [rank:2] [train], epoch: 14/50, iter: 300/834, loss: 0.34875, lr: 1.244043, top1: 0.55698, throughput: 313.44 | 2022-04-11 03:00:10.265 [rank:4] [train], epoch: 14/50, iter: 300/834, loss: 0.35041, lr: 1.244043, top1: 0.55766, throughput: 313.26 | 2022-04-11 03:00:10.267 [rank:5] [train], epoch: 14/50, iter: 300/834, loss: 0.34835, lr: 1.244043, top1: 0.55646, throughput: 313.75 | 2022-04-11 03:00:10.204 [rank:7] [train], epoch: 14/50, iter: 300/834, loss: 0.34948, lr: 1.244043, top1: 0.55661, throughput: 312.93 | 2022-04-11 03:00:10.320 [rank:2] [train], epoch: 14/50, iter: 400/834, loss: 0.35050, lr: 1.239489, top1: 0.55786, throughput: 313.02 | 2022-04-11 03:01:11.603 [rank:7] [train], epoch: 14/50, iter: 400/834, loss: 0.35318, lr: 1.239489, top1: 0.55365, throughput: 313.28 | 2022-04-11 03:01:11.607 [rank:1] [train], epoch: 14/50, iter: 400/834, loss: 0.34793, lr: 1.239489, top1: 0.56375, throughput: 312.85 | 2022-04-11 03:01:11.614 [rank:6] [train], epoch: 14/50, iter: 400/834, loss: 0.34888, lr: 1.239489, top1: 0.56406, throughput: 312.93 | 2022-04-11 03:01:11.619 [rank:5] [train], epoch: 14/50, iter: 400/834, loss: 0.34885, lr: 1.239489, top1: 0.55760, throughput: 312.50 | 2022-04-11 03:01:11.644 [rank:4] [train], epoch: 14/50, iter: 400/834, loss: 0.34845, lr: 1.239489, top1: 0.55818, throughput: 312.79 | 2022-04-11 03:01:11.651 [rank:0] [train], epoch: 14/50, iter: 400/834, loss: 0.34993, lr: 1.239489, top1: 0.55719, throughput: 312.70 | 2022-04-11 03:01:11.653 [rank:3] [train], epoch: 14/50, iter: 400/834, loss: 0.34760, lr: 1.239489, top1: 0.56318, throughput: 312.92 | 2022-04-11 03:01:11.579 [rank:6] [train], epoch: 14/50, iter: 500/834, loss: 0.35147, lr: 1.234909, top1: 0.55521, throughput: 314.64 | 2022-04-11 03:02:12.641 [rank:3] [train], epoch: 14/50, iter: 500/834, loss: 0.34942, lr: 1.234909, top1: 0.55724, throughput: 314.30 | 2022-04-11 03:02:12.667 [rank:7] [train], epoch: 14/50, iter: 500/834, loss: 0.34996, lr: 1.234909, top1: 0.55703, throughput: 314.44 | 2022-04-11 03:02:12.667 [rank:5] [train], epoch: 14/50, iter: 500/834, loss: 0.35066, lr: 1.234909, top1: 0.55688, throughput: 314.63 | 2022-04-11 03:02:12.668 [rank:4] [train], epoch: 14/50, iter: 500/834, loss: 0.34865, lr: 1.234909, top1: 0.55849, throughput: 314.65 | 2022-04-11 03:02:12.671 [rank:1] [train], epoch: 14/50, iter: 500/834, loss: 0.34851, lr: 1.234909, top1: 0.55995, throughput: 314.42 | 2022-04-11 03:02:12.678 [rank:0] [train], epoch: 14/50, iter: 500/834, loss: 0.34750, lr: 1.234909, top1: 0.55943, throughput: 314.52 | 2022-04-11 03:02:12.698 [rank:2] [train], epoch: 14/50, iter: 500/834, loss: 0.35029, lr: 1.234909, top1: 0.55719, throughput: 314.22 | 2022-04-11 03:02:12.706 [rank:7] [train], epoch: 14/50, iter: 600/834, loss: 0.34973, lr: 1.230302, top1: 0.55839, throughput: 312.76 | 2022-04-11 03:03:14.056 [rank:5] [train], epoch: 14/50, iter: 600/834, loss: 0.35185, lr: 1.230302, top1: 0.55365, throughput: 312.69 | 2022-04-11 03:03:14.071 [rank:1] [train], epoch: 14/50, iter: 600/834, loss: 0.34544, lr: 1.230302, top1: 0.56635, throughput: 312.73 | 2022-04-11 03:03:14.072 [rank:4] [train], epoch: 14/50, iter: 600/834, loss: 0.35004, lr: 1.230302, top1: 0.55620, throughput: 312.66 | 2022-04-11 03:03:14.080 [rank:2] [train], epoch: 14/50, iter: 600/834, loss: 0.35138, lr: 1.230302, top1: 0.55344, throughput: 312.81 | 2022-04-11 03:03:14.084 [rank:6] [train], epoch: 14/50, iter: 600/834, loss: 0.34658, lr: 1.230302, top1: 0.56260, throughput: 312.47 | 2022-04-11 03:03:14.088 [rank:3] [train], epoch: 14/50, iter: 600/834, loss: 0.35045, lr: 1.230302, top1: 0.55698, throughput: 312.50 | 2022-04-11 03:03:14.108 [rank:0] [train], epoch: 14/50, iter: 600/834, loss: 0.35152, lr: 1.230302, top1: 0.55521, throughput: 312.49 | 2022-04-11 03:03:14.141 [rank:2] [train], epoch: 14/50, iter: 700/834, loss: 0.35054, lr: 1.225668, top1: 0.56120, throughput: 313.08 | 2022-04-11 03:04:15.409 [rank:6] [train], epoch: 14/50, iter: 700/834, loss: 0.35178, lr: 1.225668, top1: 0.55307, throughput: 312.66 | 2022-04-11 03:04:15.497 [rank:4] [train], epoch: 14/50, iter: 700/834, loss: 0.35172, lr: 1.225668, top1: 0.55255, throughput: 312.50 | 2022-04-11 03:04:15.519 [rank:5] [train], epoch: 14/50, iter: 700/834, loss: 0.35099, lr: 1.225668, top1: 0.55516, throughput: 312.44 | 2022-04-11 03:04:15.523 [rank:0] [train], epoch: 14/50, iter: 700/834, loss: 0.34931, lr: 1.225668, top1: 0.56026, throughput: 312.74 | 2022-04-11 03:04:15.534 [rank:3] [train], epoch: 14/50, iter: 700/834, loss: 0.34972, lr: 1.225668, top1: 0.55646, throughput: 312.49 | 2022-04-11 03:04:15.550 [rank:1] [train], epoch: 14/50, iter: 700/834, loss: 0.35097, lr: 1.225668, top1: 0.55677, throughput: 312.27 | 2022-04-11 03:04:15.557 [rank:7] [train], epoch: 14/50, iter: 700/834, loss: 0.35010, lr: 1.225668, top1: 0.55359, throughput: 312.00 | 2022-04-11 03:04:15.594 [rank:6] [train], epoch: 14/50, iter: 800/834, loss: 0.34555, lr: 1.221009, top1: 0.56354, throughput: 312.65 | 2022-04-11 03:05:16.907 [rank:5] [train], epoch: 14/50, iter: 800/834, loss: 0.34842, lr: 1.221009, top1: 0.55974, throughput: 312.72 | 2022-04-11 03:05:16.918 [rank:2] [train], epoch: 14/50, iter: 800/834, loss: 0.34950, lr: 1.221009, top1: 0.55792, throughput: 312.15 | 2022-04-11 03:05:16.918 [rank:0] [train], epoch: 14/50, iter: 800/834, loss: 0.34885, lr: 1.221009, top1: 0.56349, throughput: 312.64 | 2022-04-11 03:05:16.946 [rank:3] [train], epoch: 14/50, iter: 800/834, loss: 0.34965, lr: 1.221009, top1: 0.55969, throughput: 312.72 | 2022-04-11 03:05:16.946 [rank:4] [train], epoch: 14/50, iter: 800/834, loss: 0.34852, lr: 1.221009, top1: 0.55870, throughput: 312.47 | 2022-04-11 03:05:16.965 [rank:7] [train], epoch: 14/50, iter: 800/834, loss: 0.35048, lr: 1.221009, top1: 0.55651, throughput: 312.84 | 2022-04-11 03:05:16.967 [rank:1] [train], epoch: 14/50, iter: 800/834, loss: 0.34829, lr: 1.221009, top1: 0.56313, throughput: 312.64 | 2022-04-11 03:05:16.970 [rank:2] [train], epoch: 14/50, iter: 834/834, loss: 0.35422, lr: 1.219419, top1: 0.55224, throughput: 312.79 | 2022-04-11 03:05:37.789 [rank:5] [train], epoch: 14/50, iter: 834/834, loss: 0.34921, lr: 1.219419, top1: 0.56342, throughput: 312.73 | 2022-04-11 03:05:37.793 [rank:6] [train], epoch: 14/50, iter: 834/834, loss: 0.35349, lr: 1.219419, top1: 0.55469, throughput: 312.37 | 2022-04-11 03:05:37.805 [rank:7] [train], epoch: 14/50, iter: 834/834, loss: 0.34734, lr: 1.219419, top1: 0.55622, throughput: 313.21 | 2022-04-11 03:05:37.809 [rank:1] [train], epoch: 14/50, iter: 834/834, loss: 0.34805, lr: 1.219419, top1: 0.55990, throughput: 313.25 | 2022-04-11 03:05:37.809 [rank:4] [train], epoch: 14/50, iter: 834/834, loss: 0.34728, lr: 1.219419, top1: 0.55898, throughput: 313.16 | 2022-04-11 03:05:37.810 [rank:0] [train], epoch: 14/50, iter: 834/834, loss: 0.35582, lr: 1.219419, top1: 0.55070, throughput: 312.87 | 2022-04-11 03:05:37.810 [rank:3] [train], epoch: 14/50, iter: 834/834, loss: 0.35069, lr: 1.219419, top1: 0.56020, throughput: 312.84 | 2022-04-11 03:05:37.813 [rank:0] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.56496, throughput: 489.27 | 2022-04-11 03:05:50.584 [rank:2] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.55424, throughput: 488.43 | 2022-04-11 03:05:50.585 [rank:4] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.55568, throughput: 489.23 | 2022-04-11 03:05:50.585 [rank:6] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.56448, throughput: 489.03 | 2022-04-11 03:05:50.586 [rank:7] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.56576, throughput: 489.11 | 2022-04-11 03:05:50.587 [rank:5] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.54704, throughput: 488.40 | 2022-04-11 03:05:50.590 [rank:3] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.55216, throughput: 488.42 | 2022-04-11 03:05:50.609 [rank:1] [eval], epoch: 14/50, iter: 125/125, loss: 0.00000, lr: 1.219419, top1: 0.56912, throughput: 487.85 | 2022-04-11 03:05:50.620 [rank:4] [train], epoch: 15/50, iter: 100/834, loss: 0.34504, lr: 1.214725, top1: 0.56818, throughput: 313.85 | 2022-04-11 03:06:51.762 [rank:6] [train], epoch: 15/50, iter: 100/834, loss: 0.33930, lr: 1.214725, top1: 0.57536, throughput: 313.77 | 2022-04-11 03:06:51.777 [rank:1] [train], epoch: 15/50, iter: 100/834, loss: 0.34294, lr: 1.214725, top1: 0.56865, throughput: 313.88 | 2022-04-11 03:06:51.791 [rank:7] [train], epoch: 15/50, iter: 100/834, loss: 0.34349, lr: 1.214725, top1: 0.56417, throughput: 313.63 | 2022-04-11 03:06:51.806 [rank:0] [train], epoch: 15/50, iter: 100/834, loss: 0.34113, lr: 1.214725, top1: 0.57089, throughput: 313.52 | 2022-04-11 03:06:51.825 [rank:3] [train], epoch: 15/50, iter: 100/834, loss: 0.34187, lr: 1.214725, top1: 0.57594, throughput: 313.97 | 2022-04-11 03:06:51.761 [rank:5] [train], epoch: 15/50, iter: 100/834, loss: 0.34126, lr: 1.214725, top1: 0.57510, throughput: 313.35 | 2022-04-11 03:06:51.863 [rank:2] [train], epoch: 15/50, iter: 100/834, loss: 0.34080, lr: 1.214725, top1: 0.57479, throughput: 313.79 | 2022-04-11 03:06:51.772 [rank:2] [train], epoch: 15/50, iter: 200/834, loss: 0.34563, lr: 1.210006, top1: 0.56578, throughput: 312.93 | 2022-04-11 03:07:53.127 [rank:3] [train], epoch: 15/50, iter: 200/834, loss: 0.34610, lr: 1.210006, top1: 0.56823, throughput: 312.86 | 2022-04-11 03:07:53.130 [rank:7] [train], epoch: 15/50, iter: 200/834, loss: 0.34799, lr: 1.210006, top1: 0.56135, throughput: 313.07 | 2022-04-11 03:07:53.134 [rank:0] [train], epoch: 15/50, iter: 200/834, loss: 0.34456, lr: 1.210006, top1: 0.56599, throughput: 313.16 | 2022-04-11 03:07:53.136 [rank:4] [train], epoch: 15/50, iter: 200/834, loss: 0.34655, lr: 1.210006, top1: 0.56906, throughput: 312.84 | 2022-04-11 03:07:53.136 [rank:6] [train], epoch: 15/50, iter: 200/834, loss: 0.34555, lr: 1.210006, top1: 0.56599, throughput: 312.88 | 2022-04-11 03:07:53.143 [rank:1] [train], epoch: 15/50, iter: 200/834, loss: 0.34353, lr: 1.210006, top1: 0.57312, throughput: 312.91 | 2022-04-11 03:07:53.151 [rank:5] [train], epoch: 15/50, iter: 200/834, loss: 0.34552, lr: 1.210006, top1: 0.56495, throughput: 313.12 | 2022-04-11 03:07:53.182 [rank:6] [train], epoch: 15/50, iter: 300/834, loss: 0.34620, lr: 1.205262, top1: 0.56547, throughput: 313.97 | 2022-04-11 03:08:54.296 [rank:5] [train], epoch: 15/50, iter: 300/834, loss: 0.34524, lr: 1.205262, top1: 0.56302, throughput: 314.00 | 2022-04-11 03:08:54.330 [rank:4] [train], epoch: 15/50, iter: 300/834, loss: 0.34640, lr: 1.205262, top1: 0.56760, throughput: 314.13 | 2022-04-11 03:08:54.257 [rank:7] [train], epoch: 15/50, iter: 300/834, loss: 0.34622, lr: 1.205262, top1: 0.56802, throughput: 313.60 | 2022-04-11 03:08:54.359 [rank:1] [train], epoch: 15/50, iter: 300/834, loss: 0.34653, lr: 1.205262, top1: 0.56740, throughput: 313.65 | 2022-04-11 03:08:54.365 [rank:0] [train], epoch: 15/50, iter: 300/834, loss: 0.34645, lr: 1.205262, top1: 0.56781, throughput: 313.56 | 2022-04-11 03:08:54.367 [rank:2] [train], epoch: 15/50, iter: 300/834, loss: 0.34837, lr: 1.205262, top1: 0.56448, throughput: 313.47 | 2022-04-11 03:08:54.376 [rank:3] [train], epoch: 15/50, iter: 300/834, loss: 0.34242, lr: 1.205262, top1: 0.57198, throughput: 313.34 | 2022-04-11 03:08:54.405 [rank:7] [train], epoch: 15/50, iter: 400/834, loss: 0.34329, lr: 1.200493, top1: 0.57099, throughput: 314.02 | 2022-04-11 03:09:55.502 [rank:6] [train], epoch: 15/50, iter: 400/834, loss: 0.34426, lr: 1.200493, top1: 0.56911, throughput: 313.64 | 2022-04-11 03:09:55.512 [rank:5] [train], epoch: 15/50, iter: 400/834, loss: 0.34533, lr: 1.200493, top1: 0.56667, throughput: 313.79 | 2022-04-11 03:09:55.517 [rank:2] [train], epoch: 15/50, iter: 400/834, loss: 0.34467, lr: 1.200493, top1: 0.56786, throughput: 313.88 | 2022-04-11 03:09:55.545 [rank:1] [train], epoch: 15/50, iter: 400/834, loss: 0.34462, lr: 1.200493, top1: 0.56990, throughput: 313.82 | 2022-04-11 03:09:55.547 [rank:4] [train], epoch: 15/50, iter: 400/834, loss: 0.35005, lr: 1.200493, top1: 0.55224, throughput: 313.18 | 2022-04-11 03:09:55.564 [rank:3] [train], epoch: 15/50, iter: 400/834, loss: 0.34967, lr: 1.200493, top1: 0.55734, throughput: 313.87 | 2022-04-11 03:09:55.577 [rank:0] [train], epoch: 15/50, iter: 400/834, loss: 0.34565, lr: 1.200493, top1: 0.56281, throughput: 313.52 | 2022-04-11 03:09:55.607 [rank:7] [train], epoch: 15/50, iter: 500/834, loss: 0.34959, lr: 1.195700, top1: 0.56198, throughput: 312.07 | 2022-04-11 03:10:57.026 [rank:0] [train], epoch: 15/50, iter: 500/834, loss: 0.34545, lr: 1.195700, top1: 0.56406, throughput: 312.60 | 2022-04-11 03:10:57.027 [rank:6] [train], epoch: 15/50, iter: 500/834, loss: 0.34953, lr: 1.195700, top1: 0.55583, throughput: 312.11 | 2022-04-11 03:10:57.029 [rank:3] [train], epoch: 15/50, iter: 500/834, loss: 0.34550, lr: 1.195700, top1: 0.56276, throughput: 312.39 | 2022-04-11 03:10:57.037 [rank:1] [train], epoch: 15/50, iter: 500/834, loss: 0.34623, lr: 1.195700, top1: 0.55828, throughput: 312.12 | 2022-04-11 03:10:57.061 [rank:5] [train], epoch: 15/50, iter: 500/834, loss: 0.34908, lr: 1.195700, top1: 0.55500, throughput: 311.97 | 2022-04-11 03:10:57.062 [rank:4] [train], epoch: 15/50, iter: 500/834, loss: 0.34725, lr: 1.195700, top1: 0.56354, throughput: 312.14 | 2022-04-11 03:10:57.076 [rank:2] [train], epoch: 15/50, iter: 500/834, loss: 0.34704, lr: 1.195700, top1: 0.55651, throughput: 312.35 | 2022-04-11 03:10:57.014 [rank:4] [train], epoch: 15/50, iter: 600/834, loss: 0.34668, lr: 1.190882, top1: 0.56120, throughput: 313.73 | 2022-04-11 03:11:58.274 [rank:1] [train], epoch: 15/50, iter: 600/834, loss: 0.34570, lr: 1.190882, top1: 0.56760, throughput: 313.63 | 2022-04-11 03:11:58.281 [rank:0] [train], epoch: 15/50, iter: 600/834, loss: 0.34522, lr: 1.190882, top1: 0.57214, throughput: 313.42 | 2022-04-11 03:11:58.287 [rank:2] [train], epoch: 15/50, iter: 600/834, loss: 0.34590, lr: 1.190882, top1: 0.56125, throughput: 313.34 | 2022-04-11 03:11:58.289 [rank:5] [train], epoch: 15/50, iter: 600/834, loss: 0.34904, lr: 1.190882, top1: 0.56323, throughput: 313.56 | 2022-04-11 03:11:58.295 [rank:7] [train], epoch: 15/50, iter: 600/834, loss: 0.34556, lr: 1.190882, top1: 0.56755, throughput: 313.37 | 2022-04-11 03:11:58.295 [rank:3] [train], epoch: 15/50, iter: 600/834, loss: 0.34636, lr: 1.190882, top1: 0.56745, throughput: 313.26 | 2022-04-11 03:11:58.327 [rank:6] [train], epoch: 15/50, iter: 600/834, loss: 0.34712, lr: 1.190882, top1: 0.56469, throughput: 313.18 | 2022-04-11 03:11:58.336 [rank:5] [train], epoch: 15/50, iter: 700/834, loss: 0.34668, lr: 1.186040, top1: 0.56557, throughput: 312.48 | 2022-04-11 03:12:59.738 [rank:2] [train], epoch: 15/50, iter: 700/834, loss: 0.34603, lr: 1.186040, top1: 0.56312, throughput: 312.44 | 2022-04-11 03:12:59.740 [rank:7] [train], epoch: 15/50, iter: 700/834, loss: 0.34696, lr: 1.186040, top1: 0.56224, throughput: 312.47 | 2022-04-11 03:12:59.742 [rank:0] [train], epoch: 15/50, iter: 700/834, loss: 0.34423, lr: 1.186040, top1: 0.57062, throughput: 312.39 | 2022-04-11 03:12:59.749 [rank:4] [train], epoch: 15/50, iter: 700/834, loss: 0.34739, lr: 1.186040, top1: 0.56286, throughput: 312.07 | 2022-04-11 03:12:59.798 [rank:6] [train], epoch: 15/50, iter: 700/834, loss: 0.34851, lr: 1.186040, top1: 0.56437, throughput: 312.37 | 2022-04-11 03:12:59.802 [rank:3] [train], epoch: 15/50, iter: 700/834, loss: 0.34603, lr: 1.186040, top1: 0.57031, throughput: 312.25 | 2022-04-11 03:12:59.816 [rank:1] [train], epoch: 15/50, iter: 700/834, loss: 0.34585, lr: 1.186040, top1: 0.56510, throughput: 312.39 | 2022-04-11 03:12:59.742 [rank:0] [train], epoch: 15/50, iter: 800/834, loss: 0.34960, lr: 1.181175, top1: 0.55521, throughput: 312.66 | 2022-04-11 03:14:01.158 [rank:5] [train], epoch: 15/50, iter: 800/834, loss: 0.34547, lr: 1.181175, top1: 0.56068, throughput: 312.46 | 2022-04-11 03:14:01.186 [rank:4] [train], epoch: 15/50, iter: 800/834, loss: 0.34766, lr: 1.181175, top1: 0.56151, throughput: 312.69 | 2022-04-11 03:14:01.202 [rank:6] [train], epoch: 15/50, iter: 800/834, loss: 0.34762, lr: 1.181175, top1: 0.56469, throughput: 312.63 | 2022-04-11 03:14:01.216 [rank:3] [train], epoch: 15/50, iter: 800/834, loss: 0.34402, lr: 1.181175, top1: 0.56943, throughput: 312.69 | 2022-04-11 03:14:01.218 [rank:1] [train], epoch: 15/50, iter: 800/834, loss: 0.34518, lr: 1.181175, top1: 0.56750, throughput: 312.23 | 2022-04-11 03:14:01.235 [rank:7] [train], epoch: 15/50, iter: 800/834, loss: 0.34773, lr: 1.181175, top1: 0.56120, throughput: 312.66 | 2022-04-11 03:14:01.150 [rank:2] [train], epoch: 15/50, iter: 800/834, loss: 0.34726, lr: 1.181175, top1: 0.56146, throughput: 312.14 | 2022-04-11 03:14:01.251 [rank:6] [train], epoch: 15/50, iter: 834/834, loss: 0.34750, lr: 1.179515, top1: 0.56097, throughput: 310.31 | 2022-04-11 03:14:22.253 [rank:7] [train], epoch: 15/50, iter: 834/834, loss: 0.34743, lr: 1.179515, top1: 0.56863, throughput: 309.29 | 2022-04-11 03:14:22.256 [rank:3] [train], epoch: 15/50, iter: 834/834, loss: 0.34818, lr: 1.179515, top1: 0.56143, throughput: 310.21 | 2022-04-11 03:14:22.262 [rank:2] [train], epoch: 15/50, iter: 834/834, loss: 0.34704, lr: 1.179515, top1: 0.56036, throughput: 310.66 | 2022-04-11 03:14:22.264 [rank:0] [train], epoch: 15/50, iter: 834/834, loss: 0.34849, lr: 1.179515, top1: 0.56158, throughput: 309.26 | 2022-04-11 03:14:22.267 [rank:4] [train], epoch: 15/50, iter: 834/834, loss: 0.34257, lr: 1.179515, top1: 0.57169, throughput: 309.90 | 2022-04-11 03:14:22.267 [rank:1] [train], epoch: 15/50, iter: 834/834, loss: 0.34822, lr: 1.179515, top1: 0.55775, throughput: 310.36 | 2022-04-11 03:14:22.268 [rank:5] [train], epoch: 15/50, iter: 834/834, loss: 0.34508, lr: 1.179515, top1: 0.57552, throughput: 309.65 | 2022-04-11 03:14:22.269 [rank:0] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.56448, throughput: 489.95 | 2022-04-11 03:14:35.023 [rank:2] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.56496, throughput: 489.61 | 2022-04-11 03:14:35.030 [rank:4] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.56880, throughput: 489.61 | 2022-04-11 03:14:35.032 [rank:6] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.56624, throughput: 489.05 | 2022-04-11 03:14:35.033 [rank:7] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.57856, throughput: 489.04 | 2022-04-11 03:14:35.036 [rank:5] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.56640, throughput: 489.49 | 2022-04-11 03:14:35.037 [rank:3] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.55952, throughput: 488.40 | 2022-04-11 03:14:35.059 [rank:1] [eval], epoch: 15/50, iter: 125/125, loss: 0.00000, lr: 1.179515, top1: 0.57408, throughput: 487.69 | 2022-04-11 03:14:35.084 [rank:2] [train], epoch: 16/50, iter: 100/834, loss: 0.33903, lr: 1.174618, top1: 0.57849, throughput: 310.15 | 2022-04-11 03:15:36.936 [rank:1] [train], epoch: 16/50, iter: 100/834, loss: 0.34332, lr: 1.174618, top1: 0.56854, throughput: 310.36 | 2022-04-11 03:15:36.948 [rank:4] [train], epoch: 16/50, iter: 100/834, loss: 0.33831, lr: 1.174618, top1: 0.58031, throughput: 310.10 | 2022-04-11 03:15:36.948 [rank:0] [train], epoch: 16/50, iter: 100/834, loss: 0.33886, lr: 1.174618, top1: 0.57677, throughput: 310.03 | 2022-04-11 03:15:36.953 [rank:5] [train], epoch: 16/50, iter: 100/834, loss: 0.34158, lr: 1.174618, top1: 0.57109, throughput: 310.23 | 2022-04-11 03:15:36.926 [rank:7] [train], epoch: 16/50, iter: 100/834, loss: 0.34204, lr: 1.174618, top1: 0.57073, throughput: 309.86 | 2022-04-11 03:15:37.001 [rank:6] [train], epoch: 16/50, iter: 100/834, loss: 0.33700, lr: 1.174618, top1: 0.58234, throughput: 309.82 | 2022-04-11 03:15:37.005 [rank:3] [train], epoch: 16/50, iter: 100/834, loss: 0.34049, lr: 1.174618, top1: 0.57620, throughput: 310.25 | 2022-04-11 03:15:36.946 [rank:6] [train], epoch: 16/50, iter: 200/834, loss: 0.34044, lr: 1.169698, top1: 0.57516, throughput: 314.13 | 2022-04-11 03:16:38.127 [rank:4] [train], epoch: 16/50, iter: 200/834, loss: 0.34457, lr: 1.169698, top1: 0.56807, throughput: 313.83 | 2022-04-11 03:16:38.128 [rank:1] [train], epoch: 16/50, iter: 200/834, loss: 0.34298, lr: 1.169698, top1: 0.57005, throughput: 313.75 | 2022-04-11 03:16:38.142 [rank:7] [train], epoch: 16/50, iter: 200/834, loss: 0.33943, lr: 1.169698, top1: 0.57833, throughput: 314.02 | 2022-04-11 03:16:38.143 [rank:5] [train], epoch: 16/50, iter: 200/834, loss: 0.34382, lr: 1.169698, top1: 0.57479, throughput: 313.43 | 2022-04-11 03:16:38.183 [rank:3] [train], epoch: 16/50, iter: 200/834, loss: 0.34055, lr: 1.169698, top1: 0.57901, throughput: 313.51 | 2022-04-11 03:16:38.188 [rank:2] [train], epoch: 16/50, iter: 200/834, loss: 0.34005, lr: 1.169698, top1: 0.57687, throughput: 313.44 | 2022-04-11 03:16:38.191 [rank:0] [train], epoch: 16/50, iter: 200/834, loss: 0.34300, lr: 1.169698, top1: 0.56953, throughput: 313.36 | 2022-04-11 03:16:38.224 [rank:3] [train], epoch: 16/50, iter: 300/834, loss: 0.34401, lr: 1.164755, top1: 0.56766, throughput: 315.10 | 2022-04-11 03:17:39.121 [rank:6] [train], epoch: 16/50, iter: 300/834, loss: 0.34190, lr: 1.164755, top1: 0.57521, throughput: 314.73 | 2022-04-11 03:17:39.132 [rank:5] [train], epoch: 16/50, iter: 300/834, loss: 0.33887, lr: 1.164755, top1: 0.57755, throughput: 315.02 | 2022-04-11 03:17:39.132 [rank:0] [train], epoch: 16/50, iter: 300/834, loss: 0.34057, lr: 1.164755, top1: 0.57224, throughput: 315.22 | 2022-04-11 03:17:39.135 [rank:7] [train], epoch: 16/50, iter: 300/834, loss: 0.34301, lr: 1.164755, top1: 0.56833, throughput: 314.53 | 2022-04-11 03:17:39.187 [rank:1] [train], epoch: 16/50, iter: 300/834, loss: 0.34152, lr: 1.164755, top1: 0.57484, throughput: 314.98 | 2022-04-11 03:17:39.098 [rank:4] [train], epoch: 16/50, iter: 300/834, loss: 0.34318, lr: 1.164755, top1: 0.57125, throughput: 314.87 | 2022-04-11 03:17:39.105 [rank:2] [train], epoch: 16/50, iter: 300/834, loss: 0.34221, lr: 1.164755, top1: 0.56969, throughput: 314.63 | 2022-04-11 03:17:39.215 [rank:5] [train], epoch: 16/50, iter: 400/834, loss: 0.34069, lr: 1.159790, top1: 0.57271, throughput: 314.07 | 2022-04-11 03:18:40.264 [rank:0] [train], epoch: 16/50, iter: 400/834, loss: 0.34357, lr: 1.159790, top1: 0.57240, throughput: 314.02 | 2022-04-11 03:18:40.278 [rank:2] [train], epoch: 16/50, iter: 400/834, loss: 0.34272, lr: 1.159790, top1: 0.57130, throughput: 314.26 | 2022-04-11 03:18:40.310 [rank:7] [train], epoch: 16/50, iter: 400/834, loss: 0.33903, lr: 1.159790, top1: 0.57797, throughput: 314.08 | 2022-04-11 03:18:40.317 [rank:3] [train], epoch: 16/50, iter: 400/834, loss: 0.34228, lr: 1.159790, top1: 0.57172, throughput: 313.70 | 2022-04-11 03:18:40.325 [rank:6] [train], epoch: 16/50, iter: 400/834, loss: 0.34108, lr: 1.159790, top1: 0.57703, throughput: 314.18 | 2022-04-11 03:18:40.242 [rank:1] [train], epoch: 16/50, iter: 400/834, loss: 0.34304, lr: 1.159790, top1: 0.56854, throughput: 313.55 | 2022-04-11 03:18:40.332 [rank:4] [train], epoch: 16/50, iter: 400/834, loss: 0.34334, lr: 1.159790, top1: 0.56948, throughput: 313.91 | 2022-04-11 03:18:40.270 [rank:1] [train], epoch: 16/50, iter: 500/834, loss: 0.34322, lr: 1.154803, top1: 0.57063, throughput: 314.09 | 2022-04-11 03:19:41.462 [rank:4] [train], epoch: 16/50, iter: 500/834, loss: 0.34114, lr: 1.154803, top1: 0.57432, throughput: 313.69 | 2022-04-11 03:19:41.477 [rank:6] [train], epoch: 16/50, iter: 500/834, loss: 0.34634, lr: 1.154803, top1: 0.56474, throughput: 313.49 | 2022-04-11 03:19:41.488 [rank:7] [train], epoch: 16/50, iter: 500/834, loss: 0.34346, lr: 1.154803, top1: 0.57417, throughput: 313.85 | 2022-04-11 03:19:41.494 [rank:5] [train], epoch: 16/50, iter: 500/834, loss: 0.34621, lr: 1.154803, top1: 0.56755, throughput: 313.57 | 2022-04-11 03:19:41.495 [rank:3] [train], epoch: 16/50, iter: 500/834, loss: 0.34399, lr: 1.154803, top1: 0.56693, throughput: 313.78 | 2022-04-11 03:19:41.514 [rank:0] [train], epoch: 16/50, iter: 500/834, loss: 0.34367, lr: 1.154803, top1: 0.56932, throughput: 313.54 | 2022-04-11 03:19:41.515 [rank:2] [train], epoch: 16/50, iter: 500/834, loss: 0.34400, lr: 1.154803, top1: 0.57417, throughput: 314.05 | 2022-04-11 03:19:41.447 [rank:7] [train], epoch: 16/50, iter: 600/834, loss: 0.34374, lr: 1.149793, top1: 0.56755, throughput: 313.06 | 2022-04-11 03:20:42.824 [rank:4] [train], epoch: 16/50, iter: 600/834, loss: 0.34508, lr: 1.149793, top1: 0.56656, throughput: 312.96 | 2022-04-11 03:20:42.827 [rank:5] [train], epoch: 16/50, iter: 600/834, loss: 0.34234, lr: 1.149793, top1: 0.56938, throughput: 313.02 | 2022-04-11 03:20:42.834 [rank:6] [train], epoch: 16/50, iter: 600/834, loss: 0.34025, lr: 1.149793, top1: 0.57776, throughput: 312.94 | 2022-04-11 03:20:42.842 [rank:1] [train], epoch: 16/50, iter: 600/834, loss: 0.34335, lr: 1.149793, top1: 0.56781, throughput: 312.70 | 2022-04-11 03:20:42.862 [rank:0] [train], epoch: 16/50, iter: 600/834, loss: 0.34503, lr: 1.149793, top1: 0.56490, throughput: 312.95 | 2022-04-11 03:20:42.867 [rank:3] [train], epoch: 16/50, iter: 600/834, loss: 0.34465, lr: 1.149793, top1: 0.56172, throughput: 312.90 | 2022-04-11 03:20:42.876 [rank:2] [train], epoch: 16/50, iter: 600/834, loss: 0.34482, lr: 1.149793, top1: 0.56849, throughput: 312.42 | 2022-04-11 03:20:42.902 [rank:7] [train], epoch: 16/50, iter: 700/834, loss: 0.34315, lr: 1.144762, top1: 0.57036, throughput: 311.94 | 2022-04-11 03:21:44.375 [rank:6] [train], epoch: 16/50, iter: 700/834, loss: 0.34140, lr: 1.144762, top1: 0.57349, throughput: 311.89 | 2022-04-11 03:21:44.402 [rank:5] [train], epoch: 16/50, iter: 700/834, loss: 0.34472, lr: 1.144762, top1: 0.57172, throughput: 311.75 | 2022-04-11 03:21:44.421 [rank:2] [train], epoch: 16/50, iter: 700/834, loss: 0.34567, lr: 1.144762, top1: 0.57010, throughput: 312.09 | 2022-04-11 03:21:44.423 [rank:4] [train], epoch: 16/50, iter: 700/834, loss: 0.34297, lr: 1.144762, top1: 0.57219, throughput: 311.69 | 2022-04-11 03:21:44.426 [rank:1] [train], epoch: 16/50, iter: 700/834, loss: 0.34188, lr: 1.144762, top1: 0.57193, throughput: 311.83 | 2022-04-11 03:21:44.435 [rank:3] [train], epoch: 16/50, iter: 700/834, loss: 0.34249, lr: 1.144762, top1: 0.57255, throughput: 311.82 | 2022-04-11 03:21:44.450 [rank:0] [train], epoch: 16/50, iter: 700/834, loss: 0.34665, lr: 1.144762, top1: 0.56057, throughput: 311.71 | 2022-04-11 03:21:44.463 [rank:5] [train], epoch: 16/50, iter: 800/834, loss: 0.34498, lr: 1.139709, top1: 0.56729, throughput: 313.69 | 2022-04-11 03:22:45.628 [rank:7] [train], epoch: 16/50, iter: 800/834, loss: 0.34352, lr: 1.139709, top1: 0.57052, throughput: 313.39 | 2022-04-11 03:22:45.640 [rank:6] [train], epoch: 16/50, iter: 800/834, loss: 0.34305, lr: 1.139709, top1: 0.57531, throughput: 313.53 | 2022-04-11 03:22:45.640 [rank:1] [train], epoch: 16/50, iter: 800/834, loss: 0.34406, lr: 1.139709, top1: 0.56651, throughput: 313.60 | 2022-04-11 03:22:45.658 [rank:0] [train], epoch: 16/50, iter: 800/834, loss: 0.34303, lr: 1.139709, top1: 0.57073, throughput: 313.69 | 2022-04-11 03:22:45.670 [rank:4] [train], epoch: 16/50, iter: 800/834, loss: 0.34509, lr: 1.139709, top1: 0.56708, throughput: 313.50 | 2022-04-11 03:22:45.671 [rank:2] [train], epoch: 16/50, iter: 800/834, loss: 0.34106, lr: 1.139709, top1: 0.57484, throughput: 313.44 | 2022-04-11 03:22:45.678 [rank:3] [train], epoch: 16/50, iter: 800/834, loss: 0.34179, lr: 1.139709, top1: 0.56870, throughput: 313.43 | 2022-04-11 03:22:45.707 [rank:5] [train], epoch: 16/50, iter: 834/834, loss: 0.34713, lr: 1.137987, top1: 0.56633, throughput: 312.11 | 2022-04-11 03:23:06.544 [rank:6] [train], epoch: 16/50, iter: 834/834, loss: 0.34310, lr: 1.137987, top1: 0.57215, throughput: 312.30 | 2022-04-11 03:23:06.544 [rank:4] [train], epoch: 16/50, iter: 834/834, loss: 0.34195, lr: 1.137987, top1: 0.57138, throughput: 312.73 | 2022-04-11 03:23:06.545 [rank:2] [train], epoch: 16/50, iter: 834/834, loss: 0.34610, lr: 1.137987, top1: 0.56725, throughput: 312.69 | 2022-04-11 03:23:06.555 [rank:7] [train], epoch: 16/50, iter: 834/834, loss: 0.34370, lr: 1.137987, top1: 0.56419, throughput: 312.12 | 2022-04-11 03:23:06.555 [rank:1] [train], epoch: 16/50, iter: 834/834, loss: 0.34295, lr: 1.137987, top1: 0.56756, throughput: 312.34 | 2022-04-11 03:23:06.559 [rank:3] [train], epoch: 16/50, iter: 834/834, loss: 0.34046, lr: 1.137987, top1: 0.57154, throughput: 312.98 | 2022-04-11 03:23:06.565 [rank:0] [train], epoch: 16/50, iter: 834/834, loss: 0.34742, lr: 1.137987, top1: 0.56801, throughput: 311.88 | 2022-04-11 03:23:06.601 [rank:0] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.57168, throughput: 492.53 | 2022-04-11 03:23:19.291 [rank:2] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.56144, throughput: 490.55 | 2022-04-11 03:23:19.296 [rank:7] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.56960, throughput: 489.72 | 2022-04-11 03:23:19.317 [rank:1] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.57872, throughput: 489.52 | 2022-04-11 03:23:19.326 [rank:4] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.56944, throughput: 488.78 | 2022-04-11 03:23:19.332 [rank:6] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.57072, throughput: 488.59 | 2022-04-11 03:23:19.335 [rank:3] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.57184, throughput: 489.30 | 2022-04-11 03:23:19.338 [rank:5] [eval], epoch: 16/50, iter: 125/125, loss: 0.00000, lr: 1.137987, top1: 0.56112, throughput: 488.25 | 2022-04-11 03:23:19.344 [rank:2] [train], epoch: 17/50, iter: 100/834, loss: 0.33404, lr: 1.132906, top1: 0.59078, throughput: 314.01 | 2022-04-11 03:24:20.441 [rank:7] [train], epoch: 17/50, iter: 100/834, loss: 0.34067, lr: 1.132906, top1: 0.57677, throughput: 313.92 | 2022-04-11 03:24:20.479 [rank:3] [train], epoch: 17/50, iter: 100/834, loss: 0.33711, lr: 1.132906, top1: 0.58370, throughput: 314.02 | 2022-04-11 03:24:20.480 [rank:0] [train], epoch: 17/50, iter: 100/834, loss: 0.33236, lr: 1.132906, top1: 0.59036, throughput: 313.74 | 2022-04-11 03:24:20.488 [rank:5] [train], epoch: 17/50, iter: 100/834, loss: 0.33587, lr: 1.132906, top1: 0.58068, throughput: 314.01 | 2022-04-11 03:24:20.489 [rank:1] [train], epoch: 17/50, iter: 100/834, loss: 0.33773, lr: 1.132906, top1: 0.57656, throughput: 313.91 | 2022-04-11 03:24:20.490 [rank:6] [train], epoch: 17/50, iter: 100/834, loss: 0.33647, lr: 1.132906, top1: 0.58073, throughput: 313.93 | 2022-04-11 03:24:20.496 [rank:4] [train], epoch: 17/50, iter: 100/834, loss: 0.33782, lr: 1.132906, top1: 0.58349, throughput: 313.76 | 2022-04-11 03:24:20.525 [rank:2] [train], epoch: 17/50, iter: 200/834, loss: 0.33815, lr: 1.127805, top1: 0.58208, throughput: 313.29 | 2022-04-11 03:25:21.726 [rank:1] [train], epoch: 17/50, iter: 200/834, loss: 0.33655, lr: 1.127805, top1: 0.58292, throughput: 313.53 | 2022-04-11 03:25:21.727 [rank:4] [train], epoch: 17/50, iter: 200/834, loss: 0.33868, lr: 1.127805, top1: 0.57865, throughput: 313.55 | 2022-04-11 03:25:21.759 [rank:6] [train], epoch: 17/50, iter: 200/834, loss: 0.33924, lr: 1.127805, top1: 0.57755, throughput: 313.36 | 2022-04-11 03:25:21.767 [rank:5] [train], epoch: 17/50, iter: 200/834, loss: 0.33783, lr: 1.127805, top1: 0.57635, throughput: 313.24 | 2022-04-11 03:25:21.784 [rank:3] [train], epoch: 17/50, iter: 200/834, loss: 0.33808, lr: 1.127805, top1: 0.58245, throughput: 313.09 | 2022-04-11 03:25:21.803 [rank:7] [train], epoch: 17/50, iter: 200/834, loss: 0.33594, lr: 1.127805, top1: 0.58026, throughput: 313.02 | 2022-04-11 03:25:21.817 [rank:0] [train], epoch: 17/50, iter: 200/834, loss: 0.33910, lr: 1.127805, top1: 0.58021, throughput: 313.01 | 2022-04-11 03:25:21.828 [rank:6] [train], epoch: 17/50, iter: 300/834, loss: 0.33779, lr: 1.122683, top1: 0.57839, throughput: 313.99 | 2022-04-11 03:26:22.915 [rank:1] [train], epoch: 17/50, iter: 300/834, loss: 0.33727, lr: 1.122683, top1: 0.58047, throughput: 314.06 | 2022-04-11 03:26:22.862 [rank:2] [train], epoch: 17/50, iter: 300/834, loss: 0.34006, lr: 1.122683, top1: 0.57151, throughput: 313.69 | 2022-04-11 03:26:22.932 [rank:4] [train], epoch: 17/50, iter: 300/834, loss: 0.33445, lr: 1.122683, top1: 0.58656, throughput: 313.81 | 2022-04-11 03:26:22.942 [rank:5] [train], epoch: 17/50, iter: 300/834, loss: 0.33709, lr: 1.122683, top1: 0.58203, throughput: 314.25 | 2022-04-11 03:26:22.883 [rank:7] [train], epoch: 17/50, iter: 300/834, loss: 0.33844, lr: 1.122683, top1: 0.57771, throughput: 314.42 | 2022-04-11 03:26:22.882 [rank:3] [train], epoch: 17/50, iter: 300/834, loss: 0.33955, lr: 1.122683, top1: 0.57510, throughput: 313.87 | 2022-04-11 03:26:22.975 [rank:0] [train], epoch: 17/50, iter: 300/834, loss: 0.34189, lr: 1.122683, top1: 0.57094, throughput: 314.37 | 2022-04-11 03:26:22.902 [rank:1] [train], epoch: 17/50, iter: 400/834, loss: 0.34404, lr: 1.117541, top1: 0.57073, throughput: 311.85 | 2022-04-11 03:27:24.430 [rank:6] [train], epoch: 17/50, iter: 400/834, loss: 0.33860, lr: 1.117541, top1: 0.57792, throughput: 312.06 | 2022-04-11 03:27:24.441 [rank:5] [train], epoch: 17/50, iter: 400/834, loss: 0.34231, lr: 1.117541, top1: 0.57109, throughput: 311.89 | 2022-04-11 03:27:24.442 [rank:4] [train], epoch: 17/50, iter: 400/834, loss: 0.34191, lr: 1.117541, top1: 0.57057, throughput: 312.15 | 2022-04-11 03:27:24.451 [rank:3] [train], epoch: 17/50, iter: 400/834, loss: 0.33722, lr: 1.117541, top1: 0.58630, throughput: 312.26 | 2022-04-11 03:27:24.463 [rank:2] [train], epoch: 17/50, iter: 400/834, loss: 0.34309, lr: 1.117541, top1: 0.57005, throughput: 312.03 | 2022-04-11 03:27:24.466 [rank:0] [train], epoch: 17/50, iter: 400/834, loss: 0.34037, lr: 1.117541, top1: 0.57271, throughput: 311.78 | 2022-04-11 03:27:24.484 [rank:7] [train], epoch: 17/50, iter: 400/834, loss: 0.34021, lr: 1.117541, top1: 0.57734, throughput: 311.62 | 2022-04-11 03:27:24.495 [rank:2] [train], epoch: 17/50, iter: 500/834, loss: 0.33980, lr: 1.112379, top1: 0.57297, throughput: 312.04 | 2022-04-11 03:28:25.996 [rank:7] [train], epoch: 17/50, iter: 500/834, loss: 0.33933, lr: 1.112379, top1: 0.57714, throughput: 312.18 | 2022-04-11 03:28:25.998 [rank:6] [train], epoch: 17/50, iter: 500/834, loss: 0.34051, lr: 1.112379, top1: 0.57563, throughput: 311.68 | 2022-04-11 03:28:26.042 [rank:5] [train], epoch: 17/50, iter: 500/834, loss: 0.34271, lr: 1.112379, top1: 0.57005, throughput: 311.68 | 2022-04-11 03:28:26.044 [rank:1] [train], epoch: 17/50, iter: 500/834, loss: 0.33876, lr: 1.112379, top1: 0.57896, throughput: 311.57 | 2022-04-11 03:28:26.053 [rank:4] [train], epoch: 17/50, iter: 500/834, loss: 0.33886, lr: 1.112379, top1: 0.57568, throughput: 311.66 | 2022-04-11 03:28:26.056 [rank:0] [train], epoch: 17/50, iter: 500/834, loss: 0.34019, lr: 1.112379, top1: 0.57422, throughput: 311.76 | 2022-04-11 03:28:26.069 [rank:3] [train], epoch: 17/50, iter: 500/834, loss: 0.33771, lr: 1.112379, top1: 0.57917, throughput: 311.54 | 2022-04-11 03:28:26.091 [rank:1] [train], epoch: 17/50, iter: 600/834, loss: 0.33838, lr: 1.107198, top1: 0.57812, throughput: 313.84 | 2022-04-11 03:29:27.231 [rank:2] [train], epoch: 17/50, iter: 600/834, loss: 0.33977, lr: 1.107198, top1: 0.57906, throughput: 313.39 | 2022-04-11 03:29:27.262 [rank:6] [train], epoch: 17/50, iter: 600/834, loss: 0.34189, lr: 1.107198, top1: 0.57031, throughput: 313.49 | 2022-04-11 03:29:27.288 [rank:4] [train], epoch: 17/50, iter: 600/834, loss: 0.34226, lr: 1.107198, top1: 0.56734, throughput: 313.53 | 2022-04-11 03:29:27.293 [rank:3] [train], epoch: 17/50, iter: 600/834, loss: 0.34079, lr: 1.107198, top1: 0.56896, throughput: 313.64 | 2022-04-11 03:29:27.307 [rank:5] [train], epoch: 17/50, iter: 600/834, loss: 0.34406, lr: 1.107198, top1: 0.56547, throughput: 313.38 | 2022-04-11 03:29:27.311 [rank:0] [train], epoch: 17/50, iter: 600/834, loss: 0.34054, lr: 1.107198, top1: 0.57734, throughput: 313.38 | 2022-04-11 03:29:27.337 [rank:7] [train], epoch: 17/50, iter: 600/834, loss: 0.33889, lr: 1.107198, top1: 0.57604, throughput: 313.44 | 2022-04-11 03:29:27.255 [rank:6] [train], epoch: 17/50, iter: 700/834, loss: 0.33965, lr: 1.101997, top1: 0.57625, throughput: 312.28 | 2022-04-11 03:30:28.771 [rank:7] [train], epoch: 17/50, iter: 700/834, loss: 0.33873, lr: 1.101997, top1: 0.57557, throughput: 312.07 | 2022-04-11 03:30:28.780 [rank:0] [train], epoch: 17/50, iter: 700/834, loss: 0.34157, lr: 1.101997, top1: 0.57245, throughput: 312.45 | 2022-04-11 03:30:28.786 [rank:2] [train], epoch: 17/50, iter: 700/834, loss: 0.34176, lr: 1.101997, top1: 0.57474, throughput: 312.07 | 2022-04-11 03:30:28.787 [rank:5] [train], epoch: 17/50, iter: 700/834, loss: 0.34022, lr: 1.101997, top1: 0.57594, throughput: 312.31 | 2022-04-11 03:30:28.789 [rank:3] [train], epoch: 17/50, iter: 700/834, loss: 0.34011, lr: 1.101997, top1: 0.57792, throughput: 312.21 | 2022-04-11 03:30:28.803 [rank:1] [train], epoch: 17/50, iter: 700/834, loss: 0.34223, lr: 1.101997, top1: 0.57437, throughput: 311.71 | 2022-04-11 03:30:28.828 [rank:4] [train], epoch: 17/50, iter: 700/834, loss: 0.33955, lr: 1.101997, top1: 0.57479, throughput: 311.98 | 2022-04-11 03:30:28.835 [rank:5] [train], epoch: 17/50, iter: 800/834, loss: 0.34012, lr: 1.096777, top1: 0.57526, throughput: 313.56 | 2022-04-11 03:31:30.022 [rank:1] [train], epoch: 17/50, iter: 800/834, loss: 0.33862, lr: 1.096777, top1: 0.57880, throughput: 313.68 | 2022-04-11 03:31:30.036 [rank:2] [train], epoch: 17/50, iter: 800/834, loss: 0.34383, lr: 1.096777, top1: 0.56677, throughput: 313.46 | 2022-04-11 03:31:30.039 [rank:0] [train], epoch: 17/50, iter: 800/834, loss: 0.34116, lr: 1.096777, top1: 0.57047, throughput: 313.39 | 2022-04-11 03:31:30.051 [rank:4] [train], epoch: 17/50, iter: 800/834, loss: 0.33940, lr: 1.096777, top1: 0.58125, throughput: 313.62 | 2022-04-11 03:31:30.055 [rank:6] [train], epoch: 17/50, iter: 800/834, loss: 0.34105, lr: 1.096777, top1: 0.57615, throughput: 313.16 | 2022-04-11 03:31:30.081 [rank:3] [train], epoch: 17/50, iter: 800/834, loss: 0.33956, lr: 1.096777, top1: 0.57479, throughput: 313.25 | 2022-04-11 03:31:30.095 [rank:7] [train], epoch: 17/50, iter: 800/834, loss: 0.33962, lr: 1.096777, top1: 0.57771, throughput: 313.05 | 2022-04-11 03:31:30.112 [rank:1] [train], epoch: 17/50, iter: 834/834, loss: 0.33884, lr: 1.094998, top1: 0.57843, throughput: 308.10 | 2022-04-11 03:31:51.224 [rank:4] [train], epoch: 17/50, iter: 834/834, loss: 0.34206, lr: 1.094998, top1: 0.57537, throughput: 308.03 | 2022-04-11 03:31:51.247 [rank:6] [train], epoch: 17/50, iter: 834/834, loss: 0.33919, lr: 1.094998, top1: 0.57705, throughput: 308.37 | 2022-04-11 03:31:51.251 [rank:3] [train], epoch: 17/50, iter: 834/834, loss: 0.33560, lr: 1.094998, top1: 0.58624, throughput: 308.52 | 2022-04-11 03:31:51.254 [rank:2] [train], epoch: 17/50, iter: 834/834, loss: 0.33900, lr: 1.094998, top1: 0.57705, throughput: 307.58 | 2022-04-11 03:31:51.263 [rank:7] [train], epoch: 17/50, iter: 834/834, loss: 0.33810, lr: 1.094998, top1: 0.57675, throughput: 308.42 | 2022-04-11 03:31:51.277 [rank:0] [train], epoch: 17/50, iter: 834/834, loss: 0.34416, lr: 1.094998, top1: 0.57246, throughput: 307.38 | 2022-04-11 03:31:51.288 [rank:5] [train], epoch: 17/50, iter: 834/834, loss: 0.34119, lr: 1.094998, top1: 0.57031, throughput: 306.61 | 2022-04-11 03:31:51.312 [rank:0] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.59472, throughput: 491.21 | 2022-04-11 03:32:04.012 [rank:1] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.58912, throughput: 488.69 | 2022-04-11 03:32:04.014 [rank:2] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.58080, throughput: 489.74 | 2022-04-11 03:32:04.025 [rank:7] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.58736, throughput: 490.18 | 2022-04-11 03:32:04.028 [rank:3] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.58336, throughput: 489.26 | 2022-04-11 03:32:04.029 [rank:4] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.58400, throughput: 488.90 | 2022-04-11 03:32:04.031 [rank:6] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.58272, throughput: 488.96 | 2022-04-11 03:32:04.033 [rank:5] [eval], epoch: 17/50, iter: 125/125, loss: 0.00000, lr: 1.094998, top1: 0.57344, throughput: 490.24 | 2022-04-11 03:32:04.061 [rank:4] [train], epoch: 18/50, iter: 100/834, loss: 0.33371, lr: 1.089754, top1: 0.58578, throughput: 312.26 | 2022-04-11 03:33:05.519 [rank:1] [train], epoch: 18/50, iter: 100/834, loss: 0.33313, lr: 1.089754, top1: 0.58891, throughput: 312.10 | 2022-04-11 03:33:05.533 [rank:0] [train], epoch: 18/50, iter: 100/834, loss: 0.33361, lr: 1.089754, top1: 0.58552, throughput: 312.05 | 2022-04-11 03:33:05.540 [rank:2] [train], epoch: 18/50, iter: 100/834, loss: 0.33285, lr: 1.089754, top1: 0.58812, throughput: 312.12 | 2022-04-11 03:33:05.540 [rank:7] [train], epoch: 18/50, iter: 100/834, loss: 0.33287, lr: 1.089754, top1: 0.59042, throughput: 312.08 | 2022-04-11 03:33:05.551 [rank:5] [train], epoch: 18/50, iter: 100/834, loss: 0.33472, lr: 1.089754, top1: 0.58172, throughput: 312.25 | 2022-04-11 03:33:05.551 [rank:6] [train], epoch: 18/50, iter: 100/834, loss: 0.33101, lr: 1.089754, top1: 0.59266, throughput: 312.10 | 2022-04-11 03:33:05.552 [rank:3] [train], epoch: 18/50, iter: 100/834, loss: 0.33056, lr: 1.089754, top1: 0.59203, throughput: 312.01 | 2022-04-11 03:33:05.565 [rank:4] [train], epoch: 18/50, iter: 200/834, loss: 0.33749, lr: 1.084491, top1: 0.58547, throughput: 314.04 | 2022-04-11 03:34:06.657 [rank:1] [train], epoch: 18/50, iter: 200/834, loss: 0.33515, lr: 1.084491, top1: 0.58609, throughput: 314.00 | 2022-04-11 03:34:06.680 [rank:3] [train], epoch: 18/50, iter: 200/834, loss: 0.33480, lr: 1.084491, top1: 0.58323, throughput: 314.16 | 2022-04-11 03:34:06.681 [rank:2] [train], epoch: 18/50, iter: 200/834, loss: 0.33549, lr: 1.084491, top1: 0.58318, throughput: 313.94 | 2022-04-11 03:34:06.699 [rank:5] [train], epoch: 18/50, iter: 200/834, loss: 0.33690, lr: 1.084491, top1: 0.58094, throughput: 313.96 | 2022-04-11 03:34:06.706 [rank:0] [train], epoch: 18/50, iter: 200/834, loss: 0.33167, lr: 1.084491, top1: 0.58703, throughput: 313.73 | 2022-04-11 03:34:06.738 [rank:6] [train], epoch: 18/50, iter: 200/834, loss: 0.33261, lr: 1.084491, top1: 0.59073, throughput: 314.25 | 2022-04-11 03:34:06.650 [rank:7] [train], epoch: 18/50, iter: 200/834, loss: 0.33548, lr: 1.084491, top1: 0.58125, throughput: 314.04 | 2022-04-11 03:34:06.690 [rank:2] [train], epoch: 18/50, iter: 300/834, loss: 0.33703, lr: 1.079210, top1: 0.57969, throughput: 311.84 | 2022-04-11 03:35:08.270 [rank:6] [train], epoch: 18/50, iter: 300/834, loss: 0.33732, lr: 1.079210, top1: 0.58010, throughput: 311.48 | 2022-04-11 03:35:08.292 [rank:3] [train], epoch: 18/50, iter: 300/834, loss: 0.33574, lr: 1.079210, top1: 0.58495, throughput: 311.44 | 2022-04-11 03:35:08.330 [rank:4] [train], epoch: 18/50, iter: 300/834, loss: 0.33522, lr: 1.079210, top1: 0.58333, throughput: 311.28 | 2022-04-11 03:35:08.338 [rank:7] [train], epoch: 18/50, iter: 300/834, loss: 0.33937, lr: 1.079210, top1: 0.57771, throughput: 311.37 | 2022-04-11 03:35:08.354 [rank:1] [train], epoch: 18/50, iter: 300/834, loss: 0.33677, lr: 1.079210, top1: 0.58495, throughput: 311.25 | 2022-04-11 03:35:08.367 [rank:5] [train], epoch: 18/50, iter: 300/834, loss: 0.33283, lr: 1.079210, top1: 0.58771, throughput: 311.30 | 2022-04-11 03:35:08.382 [rank:0] [train], epoch: 18/50, iter: 300/834, loss: 0.33596, lr: 1.079210, top1: 0.58641, throughput: 311.21 | 2022-04-11 03:35:08.433 [rank:1] [train], epoch: 18/50, iter: 400/834, loss: 0.33853, lr: 1.073912, top1: 0.57547, throughput: 313.48 | 2022-04-11 03:36:09.614 [rank:4] [train], epoch: 18/50, iter: 400/834, loss: 0.33285, lr: 1.073912, top1: 0.59260, throughput: 313.30 | 2022-04-11 03:36:09.621 [rank:0] [train], epoch: 18/50, iter: 400/834, loss: 0.33750, lr: 1.073912, top1: 0.57568, throughput: 313.78 | 2022-04-11 03:36:09.621 [rank:5] [train], epoch: 18/50, iter: 400/834, loss: 0.33777, lr: 1.073912, top1: 0.58052, throughput: 313.38 | 2022-04-11 03:36:09.650 [rank:3] [train], epoch: 18/50, iter: 400/834, loss: 0.33639, lr: 1.073912, top1: 0.58005, throughput: 313.06 | 2022-04-11 03:36:09.659 [rank:7] [train], epoch: 18/50, iter: 400/834, loss: 0.33728, lr: 1.073912, top1: 0.57797, throughput: 313.15 | 2022-04-11 03:36:09.667 [rank:6] [train], epoch: 18/50, iter: 400/834, loss: 0.33782, lr: 1.073912, top1: 0.58021, throughput: 312.75 | 2022-04-11 03:36:09.682 [rank:2] [train], epoch: 18/50, iter: 400/834, loss: 0.33773, lr: 1.073912, top1: 0.57906, throughput: 312.60 | 2022-04-11 03:36:09.691 [rank:5] [train], epoch: 18/50, iter: 500/834, loss: 0.33681, lr: 1.068596, top1: 0.57927, throughput: 314.03 | 2022-04-11 03:37:10.790 [rank:4] [train], epoch: 18/50, iter: 500/834, loss: 0.34179, lr: 1.068596, top1: 0.57427, throughput: 313.52 | 2022-04-11 03:37:10.861 [rank:2] [train], epoch: 18/50, iter: 500/834, loss: 0.33797, lr: 1.068596, top1: 0.57547, throughput: 313.85 | 2022-04-11 03:37:10.867 [rank:3] [train], epoch: 18/50, iter: 500/834, loss: 0.33773, lr: 1.068596, top1: 0.57615, throughput: 313.69 | 2022-04-11 03:37:10.867 [rank:7] [train], epoch: 18/50, iter: 500/834, loss: 0.33715, lr: 1.068596, top1: 0.58010, throughput: 313.60 | 2022-04-11 03:37:10.892 [rank:0] [train], epoch: 18/50, iter: 500/834, loss: 0.33924, lr: 1.068596, top1: 0.57755, throughput: 313.33 | 2022-04-11 03:37:10.899 [rank:1] [train], epoch: 18/50, iter: 500/834, loss: 0.33635, lr: 1.068596, top1: 0.58417, throughput: 313.20 | 2022-04-11 03:37:10.917 [rank:6] [train], epoch: 18/50, iter: 500/834, loss: 0.33658, lr: 1.068596, top1: 0.58422, throughput: 314.02 | 2022-04-11 03:37:10.824 [rank:1] [train], epoch: 18/50, iter: 600/834, loss: 0.33659, lr: 1.063263, top1: 0.57781, throughput: 311.94 | 2022-04-11 03:38:12.469 [rank:4] [train], epoch: 18/50, iter: 600/834, loss: 0.33742, lr: 1.063263, top1: 0.58229, throughput: 311.61 | 2022-04-11 03:38:12.477 [rank:0] [train], epoch: 18/50, iter: 600/834, loss: 0.33601, lr: 1.063263, top1: 0.58354, throughput: 311.72 | 2022-04-11 03:38:12.493 [rank:2] [train], epoch: 18/50, iter: 600/834, loss: 0.33656, lr: 1.063263, top1: 0.58406, throughput: 311.47 | 2022-04-11 03:38:12.511 [rank:5] [train], epoch: 18/50, iter: 600/834, loss: 0.33703, lr: 1.063263, top1: 0.57911, throughput: 311.05 | 2022-04-11 03:38:12.516 [rank:7] [train], epoch: 18/50, iter: 600/834, loss: 0.33981, lr: 1.063263, top1: 0.57307, throughput: 311.52 | 2022-04-11 03:38:12.525 [rank:3] [train], epoch: 18/50, iter: 600/834, loss: 0.33731, lr: 1.063263, top1: 0.58198, throughput: 311.36 | 2022-04-11 03:38:12.531 [rank:6] [train], epoch: 18/50, iter: 600/834, loss: 0.33943, lr: 1.063263, top1: 0.57932, throughput: 311.05 | 2022-04-11 03:38:12.550 [rank:2] [train], epoch: 18/50, iter: 700/834, loss: 0.33648, lr: 1.057914, top1: 0.58667, throughput: 311.59 | 2022-04-11 03:39:14.130 [rank:1] [train], epoch: 18/50, iter: 700/834, loss: 0.33670, lr: 1.057914, top1: 0.58021, throughput: 311.33 | 2022-04-11 03:39:14.140 [rank:6] [train], epoch: 18/50, iter: 700/834, loss: 0.33761, lr: 1.057914, top1: 0.57542, throughput: 311.62 | 2022-04-11 03:39:14.164 [rank:4] [train], epoch: 18/50, iter: 700/834, loss: 0.33643, lr: 1.057914, top1: 0.58286, throughput: 311.21 | 2022-04-11 03:39:14.172 [rank:7] [train], epoch: 18/50, iter: 700/834, loss: 0.33876, lr: 1.057914, top1: 0.58089, throughput: 311.39 | 2022-04-11 03:39:14.185 [rank:5] [train], epoch: 18/50, iter: 700/834, loss: 0.33990, lr: 1.057914, top1: 0.57531, throughput: 311.34 | 2022-04-11 03:39:14.185 [rank:3] [train], epoch: 18/50, iter: 700/834, loss: 0.33680, lr: 1.057914, top1: 0.58109, throughput: 311.41 | 2022-04-11 03:39:14.186 [rank:0] [train], epoch: 18/50, iter: 700/834, loss: 0.33539, lr: 1.057914, top1: 0.58568, throughput: 311.17 | 2022-04-11 03:39:14.196 [rank:4] [train], epoch: 18/50, iter: 800/834, loss: 0.33682, lr: 1.052548, top1: 0.58536, throughput: 313.91 | 2022-04-11 03:40:15.336 [rank:2] [train], epoch: 18/50, iter: 800/834, loss: 0.33997, lr: 1.052548, top1: 0.57250, throughput: 313.36 | 2022-04-11 03:40:15.401 [rank:7] [train], epoch: 18/50, iter: 800/834, loss: 0.33703, lr: 1.052548, top1: 0.58188, throughput: 313.62 | 2022-04-11 03:40:15.405 [rank:6] [train], epoch: 18/50, iter: 800/834, loss: 0.33803, lr: 1.052548, top1: 0.57776, throughput: 313.49 | 2022-04-11 03:40:15.410 [rank:1] [train], epoch: 18/50, iter: 800/834, loss: 0.33713, lr: 1.052548, top1: 0.58349, throughput: 313.20 | 2022-04-11 03:40:15.443 [rank:0] [train], epoch: 18/50, iter: 800/834, loss: 0.33798, lr: 1.052548, top1: 0.57656, throughput: 313.47 | 2022-04-11 03:40:15.447 [rank:5] [train], epoch: 18/50, iter: 800/834, loss: 0.33565, lr: 1.052548, top1: 0.58417, throughput: 313.36 | 2022-04-11 03:40:15.458 [rank:3] [train], epoch: 18/50, iter: 800/834, loss: 0.33705, lr: 1.052548, top1: 0.58078, throughput: 313.32 | 2022-04-11 03:40:15.464 [rank:6] [train], epoch: 18/50, iter: 834/834, loss: 0.33586, lr: 1.050720, top1: 0.58257, throughput: 312.86 | 2022-04-11 03:40:36.276 [rank:0] [train], epoch: 18/50, iter: 834/834, loss: 0.33932, lr: 1.050720, top1: 0.58027, throughput: 313.28 | 2022-04-11 03:40:36.284 [rank:1] [train], epoch: 18/50, iter: 834/834, loss: 0.33831, lr: 1.050720, top1: 0.57874, throughput: 313.17 | 2022-04-11 03:40:36.287 [rank:4] [train], epoch: 18/50, iter: 834/834, loss: 0.33984, lr: 1.050720, top1: 0.57583, throughput: 311.54 | 2022-04-11 03:40:36.290 [rank:7] [train], epoch: 18/50, iter: 834/834, loss: 0.33670, lr: 1.050720, top1: 0.58149, throughput: 312.56 | 2022-04-11 03:40:36.291 [rank:2] [train], epoch: 18/50, iter: 834/834, loss: 0.33503, lr: 1.050720, top1: 0.57721, throughput: 312.40 | 2022-04-11 03:40:36.297 [rank:3] [train], epoch: 18/50, iter: 834/834, loss: 0.33264, lr: 1.050720, top1: 0.58961, throughput: 313.26 | 2022-04-11 03:40:36.303 [rank:5] [train], epoch: 18/50, iter: 834/834, loss: 0.33654, lr: 1.050720, top1: 0.58762, throughput: 312.56 | 2022-04-11 03:40:36.343 [rank:0] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.60224, throughput: 489.57 | 2022-04-11 03:40:49.050 [rank:2] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.58736, throughput: 489.50 | 2022-04-11 03:40:49.065 [rank:4] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.59376, throughput: 489.08 | 2022-04-11 03:40:49.069 [rank:6] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.59168, throughput: 488.40 | 2022-04-11 03:40:49.073[rank:1] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.59600, throughput: 488.83 | 2022-04-11 03:40:49.073 [rank:7] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.58784, throughput: 488.78 | 2022-04-11 03:40:49.078 [rank:3] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.58416, throughput: 488.69 | 2022-04-11 03:40:49.092 [rank:5] [eval], epoch: 18/50, iter: 125/125, loss: 0.00000, lr: 1.050720, top1: 0.58336, throughput: 488.28 | 2022-04-11 03:40:49.143 [rank:6] [train], epoch: 19/50, iter: 100/834, loss: 0.33270, lr: 1.045332, top1: 0.58724, throughput: 312.86 | 2022-04-11 03:41:50.442 [rank:4] [train], epoch: 19/50, iter: 100/834, loss: 0.33032, lr: 1.045332, top1: 0.59073, throughput: 312.80 | 2022-04-11 03:41:50.451 [rank:2] [train], epoch: 19/50, iter: 100/834, loss: 0.33189, lr: 1.045332, top1: 0.58719, throughput: 312.74 | 2022-04-11 03:41:50.457 [rank:7] [train], epoch: 19/50, iter: 100/834, loss: 0.33336, lr: 1.045332, top1: 0.58755, throughput: 313.13 | 2022-04-11 03:41:50.394 [rank:1] [train], epoch: 19/50, iter: 100/834, loss: 0.32703, lr: 1.045332, top1: 0.59865, throughput: 312.75 | 2022-04-11 03:41:50.463 [rank:3] [train], epoch: 19/50, iter: 100/834, loss: 0.33400, lr: 1.045332, top1: 0.58911, throughput: 313.21 | 2022-04-11 03:41:50.392 [rank:5] [train], epoch: 19/50, iter: 100/834, loss: 0.33045, lr: 1.045332, top1: 0.59266, throughput: 313.03 | 2022-04-11 03:41:50.478 [rank:0] [train], epoch: 19/50, iter: 100/834, loss: 0.33071, lr: 1.045332, top1: 0.58703, throughput: 312.51 | 2022-04-11 03:41:50.489 [rank:6] [train], epoch: 19/50, iter: 200/834, loss: 0.33069, lr: 1.039929, top1: 0.59516, throughput: 312.01 | 2022-04-11 03:42:51.978 [rank:5] [train], epoch: 19/50, iter: 200/834, loss: 0.33305, lr: 1.039929, top1: 0.59109, throughput: 312.19 | 2022-04-11 03:42:51.980 [rank:7] [train], epoch: 19/50, iter: 200/834, loss: 0.33274, lr: 1.039929, top1: 0.58969, throughput: 311.67 | 2022-04-11 03:42:51.998 [rank:2] [train], epoch: 19/50, iter: 200/834, loss: 0.33489, lr: 1.039929, top1: 0.59036, throughput: 311.92 | 2022-04-11 03:42:52.011 [rank:0] [train], epoch: 19/50, iter: 200/834, loss: 0.33372, lr: 1.039929, top1: 0.58797, throughput: 312.00 | 2022-04-11 03:42:52.028 [rank:1] [train], epoch: 19/50, iter: 200/834, loss: 0.32861, lr: 1.039929, top1: 0.59500, throughput: 311.81 | 2022-04-11 03:42:52.038 [rank:3] [train], epoch: 19/50, iter: 200/834, loss: 0.33038, lr: 1.039929, top1: 0.59240, throughput: 311.40 | 2022-04-11 03:42:52.050 [rank:4] [train], epoch: 19/50, iter: 200/834, loss: 0.33393, lr: 1.039929, top1: 0.58589, throughput: 311.67 | 2022-04-11 03:42:52.053 [rank:4] [train], epoch: 19/50, iter: 300/834, loss: 0.33429, lr: 1.034510, top1: 0.58411, throughput: 314.94 | 2022-04-11 03:43:53.017 [rank:2] [train], epoch: 19/50, iter: 300/834, loss: 0.33714, lr: 1.034510, top1: 0.57813, throughput: 314.67 | 2022-04-11 03:43:53.027 [rank:1] [train], epoch: 19/50, iter: 300/834, loss: 0.33301, lr: 1.034510, top1: 0.59047, throughput: 314.73 | 2022-04-11 03:43:53.042 [rank:6] [train], epoch: 19/50, iter: 300/834, loss: 0.33283, lr: 1.034510, top1: 0.58797, throughput: 314.42 | 2022-04-11 03:43:53.043 [rank:5] [train], epoch: 19/50, iter: 300/834, loss: 0.33608, lr: 1.034510, top1: 0.58479, throughput: 314.36 | 2022-04-11 03:43:53.057 [rank:0] [train], epoch: 19/50, iter: 300/834, loss: 0.33217, lr: 1.034510, top1: 0.58917, throughput: 314.51 | 2022-04-11 03:43:53.074 [rank:3] [train], epoch: 19/50, iter: 300/834, loss: 0.33079, lr: 1.034510, top1: 0.59042, throughput: 314.59 | 2022-04-11 03:43:53.081 [rank:7] [train], epoch: 19/50, iter: 300/834, loss: 0.33202, lr: 1.034510, top1: 0.59073, throughput: 314.27 | 2022-04-11 03:43:53.092 [rank:7] [train], epoch: 19/50, iter: 400/834, loss: 0.33600, lr: 1.029076, top1: 0.57974, throughput: 312.14 | 2022-04-11 03:44:54.603 [rank:4] [train], epoch: 19/50, iter: 400/834, loss: 0.33507, lr: 1.029076, top1: 0.58375, throughput: 311.53 | 2022-04-11 03:44:54.648 [rank:3] [train], epoch: 19/50, iter: 400/834, loss: 0.33280, lr: 1.029076, top1: 0.59417, throughput: 311.82 | 2022-04-11 03:44:54.656 [rank:6] [train], epoch: 19/50, iter: 400/834, loss: 0.32998, lr: 1.029076, top1: 0.58964, throughput: 311.59 | 2022-04-11 03:44:54.663 [rank:0] [train], epoch: 19/50, iter: 400/834, loss: 0.33414, lr: 1.029076, top1: 0.58604, throughput: 311.69 | 2022-04-11 03:44:54.674 [rank:1] [train], epoch: 19/50, iter: 400/834, loss: 0.33795, lr: 1.029076, top1: 0.57844, throughput: 311.52 | 2022-04-11 03:44:54.676 [rank:2] [train], epoch: 19/50, iter: 400/834, loss: 0.33677, lr: 1.029076, top1: 0.58161, throughput: 311.37 | 2022-04-11 03:44:54.691 [rank:5] [train], epoch: 19/50, iter: 400/834, loss: 0.33317, lr: 1.029076, top1: 0.58875, throughput: 311.41 | 2022-04-11 03:44:54.711 [rank:4] [train], epoch: 19/50, iter: 500/834, loss: 0.33419, lr: 1.023627, top1: 0.58469, throughput: 313.01 | 2022-04-11 03:45:55.987 [rank:6] [train], epoch: 19/50, iter: 500/834, loss: 0.33399, lr: 1.023627, top1: 0.58641, throughput: 313.08 | 2022-04-11 03:45:55.989 [rank:0] [train], epoch: 19/50, iter: 500/834, loss: 0.33381, lr: 1.023627, top1: 0.58594, throughput: 313.06 | 2022-04-11 03:45:56.005 [rank:5] [train], epoch: 19/50, iter: 500/834, loss: 0.33289, lr: 1.023627, top1: 0.58755, throughput: 313.17 | 2022-04-11 03:45:56.020 [rank:2] [train], epoch: 19/50, iter: 500/834, loss: 0.33118, lr: 1.023627, top1: 0.59120, throughput: 312.96 | 2022-04-11 03:45:56.041 [rank:1] [train], epoch: 19/50, iter: 500/834, loss: 0.33470, lr: 1.023627, top1: 0.58302, throughput: 312.81 | 2022-04-11 03:45:56.056 [rank:3] [train], epoch: 19/50, iter: 500/834, loss: 0.33395, lr: 1.023627, top1: 0.59021, throughput: 313.10 | 2022-04-11 03:45:55.978 [rank:7] [train], epoch: 19/50, iter: 500/834, loss: 0.33551, lr: 1.023627, top1: 0.58427, throughput: 312.27 | 2022-04-11 03:45:56.088 [rank:5] [train], epoch: 19/50, iter: 600/834, loss: 0.33542, lr: 1.018164, top1: 0.58406, throughput: 314.82 | 2022-04-11 03:46:57.008 [rank:0] [train], epoch: 19/50, iter: 600/834, loss: 0.33347, lr: 1.018164, top1: 0.58755, throughput: 314.58 | 2022-04-11 03:46:57.038 [rank:2] [train], epoch: 19/50, iter: 600/834, loss: 0.33408, lr: 1.018164, top1: 0.58802, throughput: 314.77 | 2022-04-11 03:46:57.039 [rank:4] [train], epoch: 19/50, iter: 600/834, loss: 0.33318, lr: 1.018164, top1: 0.58740, throughput: 314.36 | 2022-04-11 03:46:57.065 [rank:7] [train], epoch: 19/50, iter: 600/834, loss: 0.33273, lr: 1.018164, top1: 0.58807, throughput: 314.83 | 2022-04-11 03:46:57.073 [rank:3] [train], epoch: 19/50, iter: 600/834, loss: 0.33480, lr: 1.018164, top1: 0.58620, throughput: 314.26 | 2022-04-11 03:46:57.074 [rank:1] [train], epoch: 19/50, iter: 600/834, loss: 0.33734, lr: 1.018164, top1: 0.58089, throughput: 314.49 | 2022-04-11 03:46:57.106 [rank:6] [train], epoch: 19/50, iter: 600/834, loss: 0.33446, lr: 1.018164, top1: 0.58984, throughput: 314.54 | 2022-04-11 03:46:57.031 [rank:6] [train], epoch: 19/50, iter: 700/834, loss: 0.33664, lr: 1.012687, top1: 0.58260, throughput: 312.76 | 2022-04-11 03:47:58.421 [rank:2] [train], epoch: 19/50, iter: 700/834, loss: 0.33345, lr: 1.012687, top1: 0.58135, throughput: 312.76 | 2022-04-11 03:47:58.428 [rank:4] [train], epoch: 19/50, iter: 700/834, loss: 0.33152, lr: 1.012687, top1: 0.59052, throughput: 312.71 | 2022-04-11 03:47:58.463 [rank:1] [train], epoch: 19/50, iter: 700/834, loss: 0.33531, lr: 1.012687, top1: 0.58521, throughput: 312.91 | 2022-04-11 03:47:58.467 [rank:5] [train], epoch: 19/50, iter: 700/834, loss: 0.33457, lr: 1.012687, top1: 0.58594, throughput: 312.39 | 2022-04-11 03:47:58.469 [rank:3] [train], epoch: 19/50, iter: 700/834, loss: 0.33318, lr: 1.012687, top1: 0.58672, throughput: 312.67 | 2022-04-11 03:47:58.481 [rank:7] [train], epoch: 19/50, iter: 700/834, loss: 0.33323, lr: 1.012687, top1: 0.58792, throughput: 312.55 | 2022-04-11 03:47:58.504 [rank:0] [train], epoch: 19/50, iter: 700/834, loss: 0.33355, lr: 1.012687, top1: 0.58641, throughput: 312.34 | 2022-04-11 03:47:58.509 [rank:6] [train], epoch: 19/50, iter: 800/834, loss: 0.33332, lr: 1.007195, top1: 0.59062, throughput: 311.92 | 2022-04-11 03:48:59.975 [rank:0] [train], epoch: 19/50, iter: 800/834, loss: 0.33594, lr: 1.007195, top1: 0.58599, throughput: 312.05 | 2022-04-11 03:49:00.038 [rank:1] [train], epoch: 19/50, iter: 800/834, loss: 0.33439, lr: 1.007195, top1: 0.58714, throughput: 311.83 | 2022-04-11 03:49:00.039 [rank:7] [train], epoch: 19/50, iter: 800/834, loss: 0.33330, lr: 1.007195, top1: 0.59031, throughput: 312.01 | 2022-04-11 03:49:00.041 [rank:5] [train], epoch: 19/50, iter: 800/834, loss: 0.33394, lr: 1.007195, top1: 0.58729, throughput: 311.78 | 2022-04-11 03:49:00.052 [rank:2] [train], epoch: 19/50, iter: 800/834, loss: 0.33276, lr: 1.007195, top1: 0.58953, throughput: 311.52 | 2022-04-11 03:49:00.062 [rank:3] [train], epoch: 19/50, iter: 800/834, loss: 0.33211, lr: 1.007195, top1: 0.59115, throughput: 311.74 | 2022-04-11 03:49:00.070 [rank:4] [train], epoch: 19/50, iter: 800/834, loss: 0.33506, lr: 1.007195, top1: 0.58260, throughput: 311.99 | 2022-04-11 03:49:00.004 [rank:4] [train], epoch: 19/50, iter: 834/834, loss: 0.33572, lr: 1.005325, top1: 0.58211, throughput: 312.31 | 2022-04-11 03:49:20.906 [rank:7] [train], epoch: 19/50, iter: 834/834, loss: 0.33370, lr: 1.005325, top1: 0.57736, throughput: 312.68 | 2022-04-11 03:49:20.919 [rank:1] [train], epoch: 19/50, iter: 834/834, loss: 0.33513, lr: 1.005325, top1: 0.58042, throughput: 312.47 | 2022-04-11 03:49:20.930 [rank:2] [train], epoch: 19/50, iter: 834/834, loss: 0.33001, lr: 1.005325, top1: 0.58992, throughput: 312.81 | 2022-04-11 03:49:20.931 [rank:3] [train], epoch: 19/50, iter: 834/834, loss: 0.33484, lr: 1.005325, top1: 0.59053, throughput: 312.86 | 2022-04-11 03:49:20.936 [rank:0] [train], epoch: 19/50, iter: 834/834, loss: 0.33605, lr: 1.005325, top1: 0.58333, throughput: 312.36 | 2022-04-11 03:49:20.937 [rank:5] [train], epoch: 19/50, iter: 834/834, loss: 0.33279, lr: 1.005325, top1: 0.58257, throughput: 312.04 | 2022-04-11 03:49:20.972 [rank:6] [train], epoch: 19/50, iter: 834/834, loss: 0.33915, lr: 1.005325, top1: 0.57062, throughput: 310.89 | 2022-04-11 03:49:20.973 [rank:0] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.57104, throughput: 495.83 | 2022-04-11 03:49:33.542 [rank:2] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.56224, throughput: 495.30 | 2022-04-11 03:49:33.549 [rank:1] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.57760, throughput: 494.74 | 2022-04-11 03:49:33.563 [rank:4] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.56224, throughput: 493.74 | 2022-04-11 03:49:33.565 [rank:6] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.57456, throughput: 496.16 | 2022-04-11 03:49:33.569 [rank:7] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.56224, throughput: 493.94 | 2022-04-11 03:49:33.572 [rank:3] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.56544, throughput: 493.72 | 2022-04-11 03:49:33.595 [rank:5] [eval], epoch: 19/50, iter: 125/125, loss: 0.00000, lr: 1.005325, top1: 0.56064, throughput: 495.05 | 2022-04-11 03:49:33.597 [rank:3] [train], epoch: 20/50, iter: 100/834, loss: 0.32988, lr: 0.999816, top1: 0.59385, throughput: 313.23 | 2022-04-11 03:50:34.891 [rank:4] [train], epoch: 20/50, iter: 100/834, loss: 0.32876, lr: 0.999816, top1: 0.59875, throughput: 312.91 | 2022-04-11 03:50:34.923 [rank:2] [train], epoch: 20/50, iter: 100/834, loss: 0.32896, lr: 0.999816, top1: 0.59036, throughput: 312.74 | 2022-04-11 03:50:34.943 [rank:7] [train], epoch: 20/50, iter: 100/834, loss: 0.32792, lr: 0.999816, top1: 0.59984, throughput: 312.82 | 2022-04-11 03:50:34.949 [rank:0] [train], epoch: 20/50, iter: 100/834, loss: 0.32723, lr: 0.999816, top1: 0.60276, throughput: 312.63 | 2022-04-11 03:50:34.956 [rank:6] [train], epoch: 20/50, iter: 100/834, loss: 0.33004, lr: 0.999816, top1: 0.59349, throughput: 312.69 | 2022-04-11 03:50:34.972 [rank:5] [train], epoch: 20/50, iter: 100/834, loss: 0.33026, lr: 0.999816, top1: 0.59469, throughput: 312.78 | 2022-04-11 03:50:34.982 [rank:1] [train], epoch: 20/50, iter: 100/834, loss: 0.33350, lr: 0.999816, top1: 0.58766, throughput: 312.48 | 2022-04-11 03:50:35.007 [rank:4] [train], epoch: 20/50, iter: 200/834, loss: 0.32740, lr: 0.994293, top1: 0.59708, throughput: 312.79 | 2022-04-11 03:51:36.307 [rank:3] [train], epoch: 20/50, iter: 200/834, loss: 0.33042, lr: 0.994293, top1: 0.59010, throughput: 312.61 | 2022-04-11 03:51:36.308 [rank:6] [train], epoch: 20/50, iter: 200/834, loss: 0.33105, lr: 0.994293, top1: 0.59552, throughput: 312.95 | 2022-04-11 03:51:36.323 [rank:0] [train], epoch: 20/50, iter: 200/834, loss: 0.33030, lr: 0.994293, top1: 0.59740, throughput: 312.82 | 2022-04-11 03:51:36.334 [rank:2] [train], epoch: 20/50, iter: 200/834, loss: 0.32843, lr: 0.994293, top1: 0.59635, throughput: 312.73 | 2022-04-11 03:51:36.337 [rank:5] [train], epoch: 20/50, iter: 200/834, loss: 0.32756, lr: 0.994293, top1: 0.59958, throughput: 312.88 | 2022-04-11 03:51:36.348 [rank:1] [train], epoch: 20/50, iter: 200/834, loss: 0.32842, lr: 0.994293, top1: 0.59599, throughput: 313.00 | 2022-04-11 03:51:36.348 [rank:7] [train], epoch: 20/50, iter: 200/834, loss: 0.32879, lr: 0.994293, top1: 0.59464, throughput: 312.70 | 2022-04-11 03:51:36.351 [rank:2] [train], epoch: 20/50, iter: 300/834, loss: 0.32860, lr: 0.988758, top1: 0.59531, throughput: 314.04 | 2022-04-11 03:52:37.476 [rank:5] [train], epoch: 20/50, iter: 300/834, loss: 0.33151, lr: 0.988758, top1: 0.58870, throughput: 314.05 | 2022-04-11 03:52:37.484 [rank:4] [train], epoch: 20/50, iter: 300/834, loss: 0.33175, lr: 0.988758, top1: 0.58714, throughput: 313.83 | 2022-04-11 03:52:37.486 [rank:3] [train], epoch: 20/50, iter: 300/834, loss: 0.33018, lr: 0.988758, top1: 0.59448, throughput: 313.80 | 2022-04-11 03:52:37.494 [rank:0] [train], epoch: 20/50, iter: 300/834, loss: 0.33298, lr: 0.988758, top1: 0.58661, throughput: 313.88 | 2022-04-11 03:52:37.505 [rank:7] [train], epoch: 20/50, iter: 300/834, loss: 0.32996, lr: 0.988758, top1: 0.58995, throughput: 313.84 | 2022-04-11 03:52:37.528 [rank:6] [train], epoch: 20/50, iter: 300/834, loss: 0.32908, lr: 0.988758, top1: 0.59516, throughput: 313.66 | 2022-04-11 03:52:37.535 [rank:1] [train], epoch: 20/50, iter: 300/834, loss: 0.33024, lr: 0.988758, top1: 0.59771, throughput: 313.69 | 2022-04-11 03:52:37.555 [rank:7] [train], epoch: 20/50, iter: 400/834, loss: 0.33023, lr: 0.983210, top1: 0.58911, throughput: 313.60 | 2022-04-11 03:53:38.753 [rank:6] [train], epoch: 20/50, iter: 400/834, loss: 0.32931, lr: 0.983210, top1: 0.59479, throughput: 313.61 | 2022-04-11 03:53:38.758 [rank:2] [train], epoch: 20/50, iter: 400/834, loss: 0.33187, lr: 0.983210, top1: 0.59344, throughput: 313.21 | 2022-04-11 03:53:38.777 [rank:3] [train], epoch: 20/50, iter: 400/834, loss: 0.33145, lr: 0.983210, top1: 0.59182, throughput: 313.55 | 2022-04-11 03:53:38.729 [rank:4] [train], epoch: 20/50, iter: 400/834, loss: 0.32819, lr: 0.983210, top1: 0.59693, throughput: 313.19 | 2022-04-11 03:53:38.791 [rank:5] [train], epoch: 20/50, iter: 400/834, loss: 0.33131, lr: 0.983210, top1: 0.59474, throughput: 313.16 | 2022-04-11 03:53:38.794 [rank:1] [train], epoch: 20/50, iter: 400/834, loss: 0.33199, lr: 0.983210, top1: 0.58740, throughput: 313.25 | 2022-04-11 03:53:38.847 [rank:0] [train], epoch: 20/50, iter: 400/834, loss: 0.33245, lr: 0.983210, top1: 0.58911, throughput: 312.97 | 2022-04-11 03:53:38.852 [rank:1] [train], epoch: 20/50, iter: 500/834, loss: 0.32779, lr: 0.977649, top1: 0.60005, throughput: 312.32 | 2022-04-11 03:54:40.322 [rank:4] [train], epoch: 20/50, iter: 500/834, loss: 0.33199, lr: 0.977649, top1: 0.58615, throughput: 312.00 | 2022-04-11 03:54:40.330 [rank:2] [train], epoch: 20/50, iter: 500/834, loss: 0.33170, lr: 0.977649, top1: 0.59187, throughput: 311.92 | 2022-04-11 03:54:40.331 [rank:7] [train], epoch: 20/50, iter: 500/834, loss: 0.33094, lr: 0.977649, top1: 0.59089, throughput: 311.67 | 2022-04-11 03:54:40.357 [rank:5] [train], epoch: 20/50, iter: 500/834, loss: 0.33294, lr: 0.977649, top1: 0.58938, throughput: 311.84 | 2022-04-11 03:54:40.363 [rank:0] [train], epoch: 20/50, iter: 500/834, loss: 0.33363, lr: 0.977649, top1: 0.58984, throughput: 312.09 | 2022-04-11 03:54:40.372 [rank:3] [train], epoch: 20/50, iter: 500/834, loss: 0.33313, lr: 0.977649, top1: 0.58760, throughput: 311.37 | 2022-04-11 03:54:40.392 [rank:6] [train], epoch: 20/50, iter: 500/834, loss: 0.33194, lr: 0.977649, top1: 0.59245, throughput: 311.45 | 2022-04-11 03:54:40.406 [rank:4] [train], epoch: 20/50, iter: 600/834, loss: 0.33094, lr: 0.972077, top1: 0.59182, throughput: 314.02 | 2022-04-11 03:55:41.473 [rank:7] [train], epoch: 20/50, iter: 600/834, loss: 0.33142, lr: 0.972077, top1: 0.59063, throughput: 313.89 | 2022-04-11 03:55:41.526 [rank:3] [train], epoch: 20/50, iter: 600/834, loss: 0.33167, lr: 0.972077, top1: 0.59125, throughput: 314.00 | 2022-04-11 03:55:41.538 [rank:2] [train], epoch: 20/50, iter: 600/834, loss: 0.33199, lr: 0.972077, top1: 0.58984, throughput: 313.67 | 2022-04-11 03:55:41.543 [rank:6] [train], epoch: 20/50, iter: 600/834, loss: 0.33175, lr: 0.972077, top1: 0.59188, throughput: 314.05 | 2022-04-11 03:55:41.544 [rank:1] [train], epoch: 20/50, iter: 600/834, loss: 0.33326, lr: 0.972077, top1: 0.58802, throughput: 313.50 | 2022-04-11 03:55:41.566 [rank:0] [train], epoch: 20/50, iter: 600/834, loss: 0.33145, lr: 0.972077, top1: 0.59255, throughput: 313.74 | 2022-04-11 03:55:41.569 [rank:5] [train], epoch: 20/50, iter: 600/834, loss: 0.33333, lr: 0.972077, top1: 0.58682, throughput: 313.63 | 2022-04-11 03:55:41.582 [rank:6] [train], epoch: 20/50, iter: 700/834, loss: 0.33343, lr: 0.966494, top1: 0.58432, throughput: 314.50 | 2022-04-11 03:56:42.593 [rank:3] [train], epoch: 20/50, iter: 700/834, loss: 0.33057, lr: 0.966494, top1: 0.59193, throughput: 314.43 | 2022-04-11 03:56:42.601 [rank:5] [train], epoch: 20/50, iter: 700/834, loss: 0.32910, lr: 0.966494, top1: 0.59474, throughput: 314.58 | 2022-04-11 03:56:42.615 [rank:0] [train], epoch: 20/50, iter: 700/834, loss: 0.33308, lr: 0.966494, top1: 0.59063, throughput: 314.51 | 2022-04-11 03:56:42.616 [rank:4] [train], epoch: 20/50, iter: 700/834, loss: 0.33271, lr: 0.966494, top1: 0.58677, throughput: 313.95 | 2022-04-11 03:56:42.629 [rank:2] [train], epoch: 20/50, iter: 700/834, loss: 0.33118, lr: 0.966494, top1: 0.59115, throughput: 314.27 | 2022-04-11 03:56:42.637 [rank:1] [train], epoch: 20/50, iter: 700/834, loss: 0.33221, lr: 0.966494, top1: 0.58729, throughput: 314.29 | 2022-04-11 03:56:42.655 [rank:7] [train], epoch: 20/50, iter: 700/834, loss: 0.33064, lr: 0.966494, top1: 0.59370, throughput: 314.47 | 2022-04-11 03:56:42.581 [rank:4] [train], epoch: 20/50, iter: 800/834, loss: 0.32997, lr: 0.960899, top1: 0.58896, throughput: 313.14 | 2022-04-11 03:57:43.942 [rank:5] [train], epoch: 20/50, iter: 800/834, loss: 0.33333, lr: 0.960899, top1: 0.58682, throughput: 313.06 | 2022-04-11 03:57:43.946 [rank:2] [train], epoch: 20/50, iter: 800/834, loss: 0.33080, lr: 0.960899, top1: 0.59229, throughput: 313.10 | 2022-04-11 03:57:43.960 [rank:6] [train], epoch: 20/50, iter: 800/834, loss: 0.33069, lr: 0.960899, top1: 0.59312, throughput: 312.80 | 2022-04-11 03:57:43.974 [rank:0] [train], epoch: 20/50, iter: 800/834, loss: 0.33196, lr: 0.960899, top1: 0.59177, throughput: 312.87 | 2022-04-11 03:57:43.983 [rank:3] [train], epoch: 20/50, iter: 800/834, loss: 0.33279, lr: 0.960899, top1: 0.58901, throughput: 312.72 | 2022-04-11 03:57:43.998 [rank:1] [train], epoch: 20/50, iter: 800/834, loss: 0.33385, lr: 0.960899, top1: 0.58958, throughput: 312.96 | 2022-04-11 03:57:44.004 [rank:7] [train], epoch: 20/50, iter: 800/834, loss: 0.33498, lr: 0.960899, top1: 0.58552, throughput: 312.97 | 2022-04-11 03:57:43.928 [rank:5] [train], epoch: 20/50, iter: 834/834, loss: 0.33236, lr: 0.958994, top1: 0.58946, throughput: 314.81 | 2022-04-11 03:58:04.682 [rank:6] [train], epoch: 20/50, iter: 834/834, loss: 0.33115, lr: 0.958994, top1: 0.59298, throughput: 314.49 | 2022-04-11 03:58:04.732 [rank:4] [train], epoch: 20/50, iter: 834/834, loss: 0.33526, lr: 0.958994, top1: 0.57767, throughput: 313.83 | 2022-04-11 03:58:04.744 [rank:0] [train], epoch: 20/50, iter: 834/834, loss: 0.33102, lr: 0.958994, top1: 0.59406, throughput: 314.42 | 2022-04-11 03:58:04.745 [rank:7] [train], epoch: 20/50, iter: 834/834, loss: 0.33774, lr: 0.958994, top1: 0.58532, throughput: 313.47 | 2022-04-11 03:58:04.752 [rank:1] [train], epoch: 20/50, iter: 834/834, loss: 0.33162, lr: 0.958994, top1: 0.59038, throughput: 314.19 | 2022-04-11 03:58:04.781 [rank:2] [train], epoch: 20/50, iter: 834/834, loss: 0.33440, lr: 0.958994, top1: 0.58808, throughput: 313.36 | 2022-04-11 03:58:04.792 [rank:3] [train], epoch: 20/50, iter: 834/834, loss: 0.33534, lr: 0.958994, top1: 0.58272, throughput: 314.68 | 2022-04-11 03:58:04.742 [rank:0] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.61088, throughput: 496.30 | 2022-04-11 03:58:17.339 [rank:2] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.59616, throughput: 497.38 | 2022-04-11 03:58:17.358 [rank:7] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.60288, throughput: 495.75 | 2022-04-11 03:58:17.360 [rank:1] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.61008, throughput: 496.64 | 2022-04-11 03:58:17.366 [rank:6] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.60176, throughput: 494.16 | 2022-04-11 03:58:17.379 [rank:3] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.59856, throughput: 494.52 | 2022-04-11 03:58:17.381 [rank:4] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.60192, throughput: 494.29 | 2022-04-11 03:58:17.388 [rank:5] [eval], epoch: 20/50, iter: 125/125, loss: 0.00000, lr: 0.958994, top1: 0.59744, throughput: 490.66 | 2022-04-11 03:58:17.420 [rank:1] [train], epoch: 21/50, iter: 100/834, loss: 0.32619, lr: 0.953384, top1: 0.59927, throughput: 311.87 | 2022-04-11 03:59:18.929 [rank:6] [train], epoch: 21/50, iter: 100/834, loss: 0.33074, lr: 0.953384, top1: 0.59464, throughput: 311.85 | 2022-04-11 03:59:18.947 [rank:5] [train], epoch: 21/50, iter: 100/834, loss: 0.32644, lr: 0.953384, top1: 0.60234, throughput: 312.01 | 2022-04-11 03:59:18.956 [rank:2] [train], epoch: 21/50, iter: 100/834, loss: 0.32277, lr: 0.953384, top1: 0.60786, throughput: 311.59 | 2022-04-11 03:59:18.977 [rank:3] [train], epoch: 21/50, iter: 100/834, loss: 0.32309, lr: 0.953384, top1: 0.61000, throughput: 311.67 | 2022-04-11 03:59:18.985 [rank:7] [train], epoch: 21/50, iter: 100/834, loss: 0.32181, lr: 0.953384, top1: 0.61359, throughput: 311.56 | 2022-04-11 03:59:18.985 [rank:0] [train], epoch: 21/50, iter: 100/834, loss: 0.32922, lr: 0.953384, top1: 0.59250, throughput: 311.44 | 2022-04-11 03:59:18.988 [rank:4] [train], epoch: 21/50, iter: 100/834, loss: 0.32677, lr: 0.953384, top1: 0.60151, throughput: 311.61 | 2022-04-11 03:59:19.005 [rank:3] [train], epoch: 21/50, iter: 200/834, loss: 0.32643, lr: 0.947764, top1: 0.59807, throughput: 313.60 | 2022-04-11 04:00:20.210 [rank:6] [train], epoch: 21/50, iter: 200/834, loss: 0.32736, lr: 0.947764, top1: 0.60036, throughput: 313.30 | 2022-04-11 04:00:20.230 [rank:5] [train], epoch: 21/50, iter: 200/834, loss: 0.32380, lr: 0.947764, top1: 0.60672, throughput: 313.35 | 2022-04-11 04:00:20.230 [rank:0] [train], epoch: 21/50, iter: 200/834, loss: 0.32802, lr: 0.947764, top1: 0.59505, throughput: 313.49 | 2022-04-11 04:00:20.233 [rank:1] [train], epoch: 21/50, iter: 200/834, loss: 0.32555, lr: 0.947764, top1: 0.59943, throughput: 313.13 | 2022-04-11 04:00:20.245 [rank:7] [train], epoch: 21/50, iter: 200/834, loss: 0.32767, lr: 0.947764, top1: 0.59578, throughput: 313.38 | 2022-04-11 04:00:20.253 [rank:2] [train], epoch: 21/50, iter: 200/834, loss: 0.32661, lr: 0.947764, top1: 0.59849, throughput: 313.33 | 2022-04-11 04:00:20.255 [rank:4] [train], epoch: 21/50, iter: 200/834, loss: 0.32831, lr: 0.947764, top1: 0.59427, throughput: 313.68 | 2022-04-11 04:00:20.214 [rank:1] [train], epoch: 21/50, iter: 300/834, loss: 0.32783, lr: 0.942134, top1: 0.59297, throughput: 313.38 | 2022-04-11 04:01:21.512 [rank:6] [train], epoch: 21/50, iter: 300/834, loss: 0.32960, lr: 0.942134, top1: 0.59323, throughput: 313.23 | 2022-04-11 04:01:21.526 [rank:2] [train], epoch: 21/50, iter: 300/834, loss: 0.32435, lr: 0.942134, top1: 0.60719, throughput: 313.33 | 2022-04-11 04:01:21.532 [rank:3] [train], epoch: 21/50, iter: 300/834, loss: 0.32710, lr: 0.942134, top1: 0.60203, throughput: 313.05 | 2022-04-11 04:01:21.541 [rank:0] [train], epoch: 21/50, iter: 300/834, loss: 0.32592, lr: 0.942134, top1: 0.60208, throughput: 313.12 | 2022-04-11 04:01:21.551 [rank:5] [train], epoch: 21/50, iter: 300/834, loss: 0.32818, lr: 0.942134, top1: 0.59688, throughput: 313.09 | 2022-04-11 04:01:21.555 [rank:7] [train], epoch: 21/50, iter: 300/834, loss: 0.32938, lr: 0.942134, top1: 0.59328, throughput: 313.18 | 2022-04-11 04:01:21.560 [rank:4] [train], epoch: 21/50, iter: 300/834, loss: 0.32846, lr: 0.942134, top1: 0.59833, throughput: 312.92 | 2022-04-11 04:01:21.571 [rank:7] [train], epoch: 21/50, iter: 400/834, loss: 0.32838, lr: 0.936494, top1: 0.59375, throughput: 314.19 | 2022-04-11 04:02:22.670 [rank:1] [train], epoch: 21/50, iter: 400/834, loss: 0.32661, lr: 0.936494, top1: 0.60333, throughput: 313.88 | 2022-04-11 04:02:22.683 [rank:5] [train], epoch: 21/50, iter: 400/834, loss: 0.32800, lr: 0.936494, top1: 0.60146, throughput: 313.99 | 2022-04-11 04:02:22.702 [rank:6] [train], epoch: 21/50, iter: 400/834, loss: 0.32982, lr: 0.936494, top1: 0.59135, throughput: 313.81 | 2022-04-11 04:02:22.709 [rank:0] [train], epoch: 21/50, iter: 400/834, loss: 0.32749, lr: 0.936494, top1: 0.59828, throughput: 313.87 | 2022-04-11 04:02:22.723 [rank:3] [train], epoch: 21/50, iter: 400/834, loss: 0.32828, lr: 0.936494, top1: 0.59687, throughput: 313.76 | 2022-04-11 04:02:22.734 [rank:4] [train], epoch: 21/50, iter: 400/834, loss: 0.32619, lr: 0.936494, top1: 0.60359, throughput: 314.32 | 2022-04-11 04:02:22.656 [rank:2] [train], epoch: 21/50, iter: 400/834, loss: 0.32811, lr: 0.936494, top1: 0.59630, throughput: 314.10 | 2022-04-11 04:02:22.659 [rank:5] [train], epoch: 21/50, iter: 500/834, loss: 0.32938, lr: 0.930844, top1: 0.59151, throughput: 314.30 | 2022-04-11 04:03:23.791 [rank:3] [train], epoch: 21/50, iter: 500/834, loss: 0.32566, lr: 0.930844, top1: 0.60510, throughput: 314.40 | 2022-04-11 04:03:23.802 [rank:0] [train], epoch: 21/50, iter: 500/834, loss: 0.33021, lr: 0.930844, top1: 0.59281, throughput: 314.31 | 2022-04-11 04:03:23.810 [rank:4] [train], epoch: 21/50, iter: 500/834, loss: 0.32621, lr: 0.930844, top1: 0.60260, throughput: 313.95 | 2022-04-11 04:03:23.812 [rank:6] [train], epoch: 21/50, iter: 500/834, loss: 0.32950, lr: 0.930844, top1: 0.59417, throughput: 314.10 | 2022-04-11 04:03:23.837 [rank:1] [train], epoch: 21/50, iter: 500/834, loss: 0.32847, lr: 0.930844, top1: 0.59859, throughput: 313.90 | 2022-04-11 04:03:23.849 [rank:7] [train], epoch: 21/50, iter: 500/834, loss: 0.32976, lr: 0.930844, top1: 0.59318, throughput: 313.73 | 2022-04-11 04:03:23.868 [rank:2] [train], epoch: 21/50, iter: 500/834, loss: 0.32939, lr: 0.930844, top1: 0.59526, throughput: 313.64 | 2022-04-11 04:03:23.876 [rank:4] [train], epoch: 21/50, iter: 600/834, loss: 0.32956, lr: 0.925185, top1: 0.59297, throughput: 313.11 | 2022-04-11 04:04:25.133 [rank:7] [train], epoch: 21/50, iter: 600/834, loss: 0.32884, lr: 0.925185, top1: 0.59583, throughput: 313.29 | 2022-04-11 04:04:25.153 [rank:2] [train], epoch: 21/50, iter: 600/834, loss: 0.32608, lr: 0.925185, top1: 0.60135, throughput: 313.32 | 2022-04-11 04:04:25.155 [rank:5] [train], epoch: 21/50, iter: 600/834, loss: 0.32695, lr: 0.925185, top1: 0.59927, throughput: 312.79 | 2022-04-11 04:04:25.174 [rank:6] [train], epoch: 21/50, iter: 600/834, loss: 0.32817, lr: 0.925185, top1: 0.59396, throughput: 312.98 | 2022-04-11 04:04:25.183 [rank:1] [train], epoch: 21/50, iter: 600/834, loss: 0.33016, lr: 0.925185, top1: 0.59031, throughput: 313.01 | 2022-04-11 04:04:25.189 [rank:3] [train], epoch: 21/50, iter: 600/834, loss: 0.33204, lr: 0.925185, top1: 0.59010, throughput: 313.04 | 2022-04-11 04:04:25.136 [rank:0] [train], epoch: 21/50, iter: 600/834, loss: 0.32783, lr: 0.925185, top1: 0.59729, throughput: 313.09 | 2022-04-11 04:04:25.135 [rank:6] [train], epoch: 21/50, iter: 700/834, loss: 0.32651, lr: 0.919517, top1: 0.60203, throughput: 313.50 | 2022-04-11 04:05:26.428 [rank:2] [train], epoch: 21/50, iter: 700/834, loss: 0.33120, lr: 0.919517, top1: 0.58938, throughput: 313.08 | 2022-04-11 04:05:26.481 [rank:7] [train], epoch: 21/50, iter: 700/834, loss: 0.32666, lr: 0.919517, top1: 0.60135, throughput: 313.00 | 2022-04-11 04:05:26.495 [rank:4] [train], epoch: 21/50, iter: 700/834, loss: 0.32552, lr: 0.919517, top1: 0.60286, throughput: 312.79 | 2022-04-11 04:05:26.516 [rank:1] [train], epoch: 21/50, iter: 700/834, loss: 0.32992, lr: 0.919517, top1: 0.59484, throughput: 312.99 | 2022-04-11 04:05:26.532 [rank:0] [train], epoch: 21/50, iter: 700/834, loss: 0.33058, lr: 0.919517, top1: 0.59021, throughput: 312.62 | 2022-04-11 04:05:26.552 [rank:5] [train], epoch: 21/50, iter: 700/834, loss: 0.33193, lr: 0.919517, top1: 0.59458, throughput: 312.75 | 2022-04-11 04:05:26.565 [rank:3] [train], epoch: 21/50, iter: 700/834, loss: 0.32808, lr: 0.919517, top1: 0.59854, throughput: 312.79 | 2022-04-11 04:05:26.518 [rank:4] [train], epoch: 21/50, iter: 800/834, loss: 0.32781, lr: 0.913841, top1: 0.59620, throughput: 313.38 | 2022-04-11 04:06:27.785 [rank:2] [train], epoch: 21/50, iter: 800/834, loss: 0.32506, lr: 0.913841, top1: 0.60073, throughput: 312.89 | 2022-04-11 04:06:27.845 [rank:7] [train], epoch: 21/50, iter: 800/834, loss: 0.32919, lr: 0.913841, top1: 0.59474, throughput: 312.85 | 2022-04-11 04:06:27.866 [rank:6] [train], epoch: 21/50, iter: 800/834, loss: 0.32673, lr: 0.913841, top1: 0.59969, throughput: 312.42 | 2022-04-11 04:06:27.883 [rank:1] [train], epoch: 21/50, iter: 800/834, loss: 0.32826, lr: 0.913841, top1: 0.59620, throughput: 312.93 | 2022-04-11 04:06:27.888 [rank:5] [train], epoch: 21/50, iter: 800/834, loss: 0.32757, lr: 0.913841, top1: 0.59682, throughput: 313.09 | 2022-04-11 04:06:27.888 [rank:0] [train], epoch: 21/50, iter: 800/834, loss: 0.32805, lr: 0.913841, top1: 0.59208, throughput: 313.01 | 2022-04-11 04:06:27.892 [rank:3] [train], epoch: 21/50, iter: 800/834, loss: 0.32810, lr: 0.913841, top1: 0.59599, throughput: 312.76 | 2022-04-11 04:06:27.908 [rank:4] [train], epoch: 21/50, iter: 834/834, loss: 0.32382, lr: 0.911909, top1: 0.59743, throughput: 310.12 | 2022-04-11 04:06:48.835 [rank:5] [train], epoch: 21/50, iter: 834/834, loss: 0.33113, lr: 0.911909, top1: 0.58517, throughput: 311.64 | 2022-04-11 04:06:48.835 [rank:7] [train], epoch: 21/50, iter: 834/834, loss: 0.32701, lr: 0.911909, top1: 0.60034, throughput: 311.21 | 2022-04-11 04:06:48.842 [rank:3] [train], epoch: 21/50, iter: 834/834, loss: 0.32608, lr: 0.911909, top1: 0.59881, throughput: 311.81 | 2022-04-11 04:06:48.844 [rank:6] [train], epoch: 21/50, iter: 834/834, loss: 0.32257, lr: 0.911909, top1: 0.61320, throughput: 311.42 | 2022-04-11 04:06:48.845 [rank:0] [train], epoch: 21/50, iter: 834/834, loss: 0.32883, lr: 0.911909, top1: 0.59145, throughput: 311.54[rank:2] [train], epoch: 21/50, iter: 834/834, loss: 0.32875, lr: 0.911909, top1: 0.59467, throughput: 310.84 | 2022-04-11 04:06:48.846 | 2022-04-11 04:06:48.846 [rank:1] [train], epoch: 21/50, iter: 834/834, loss: 0.32914, lr: 0.911909, top1: 0.59589, throughput: 310.82 | 2022-04-11 04:06:48.891 [rank:0] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.63040, throughput: 495.72 | 2022-04-11 04:07:01.454 [rank:2] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.60752, throughput: 495.68 | 2022-04-11 04:07:01.455 [rank:3] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.61136, throughput: 495.27 | 2022-04-11 04:07:01.463 [rank:5] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.60752, throughput: 494.62 | 2022-04-11 04:07:01.471 [rank:7] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.62080, throughput: 494.57 | 2022-04-11 04:07:01.479 [rank:6] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.61808, throughput: 494.49 | 2022-04-11 04:07:01.484 [rank:1] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.62160, throughput: 495.83 | 2022-04-11 04:07:01.496 [rank:4] [eval], epoch: 21/50, iter: 125/125, loss: 0.00000, lr: 0.911909, top1: 0.61936, throughput: 493.57 | 2022-04-11 04:07:01.498 [rank:5] [train], epoch: 22/50, iter: 100/834, loss: 0.32481, lr: 0.906221, top1: 0.60635, throughput: 313.78 | 2022-04-11 04:08:02.661 [rank:4] [train], epoch: 22/50, iter: 100/834, loss: 0.32280, lr: 0.906221, top1: 0.61146, throughput: 313.86 | 2022-04-11 04:08:02.671 [rank:3] [train], epoch: 22/50, iter: 100/834, loss: 0.32036, lr: 0.906221, top1: 0.61646, throughput: 313.60 | 2022-04-11 04:08:02.688 [rank:2] [train], epoch: 22/50, iter: 100/834, loss: 0.32371, lr: 0.906221, top1: 0.60641, throughput: 313.45 | 2022-04-11 04:08:02.710 [rank:1] [train], epoch: 22/50, iter: 100/834, loss: 0.31835, lr: 0.906221, top1: 0.61677, throughput: 313.64 | 2022-04-11 04:08:02.713 [rank:0] [train], epoch: 22/50, iter: 100/834, loss: 0.32264, lr: 0.906221, top1: 0.60365, throughput: 313.39 | 2022-04-11 04:08:02.719 [rank:6] [train], epoch: 22/50, iter: 100/834, loss: 0.32526, lr: 0.906221, top1: 0.60255, throughput: 313.49 | 2022-04-11 04:08:02.730 [rank:7] [train], epoch: 22/50, iter: 100/834, loss: 0.32502, lr: 0.906221, top1: 0.60073, throughput: 313.39 | 2022-04-11 04:08:02.745 [rank:4] [train], epoch: 22/50, iter: 200/834, loss: 0.32313, lr: 0.900526, top1: 0.60536, throughput: 312.57 | 2022-04-11 04:09:04.096 [rank:5] [train], epoch: 22/50, iter: 200/834, loss: 0.32425, lr: 0.900526, top1: 0.60714, throughput: 312.41 | 2022-04-11 04:09:04.118 [rank:3] [train], epoch: 22/50, iter: 200/834, loss: 0.32320, lr: 0.900526, top1: 0.60703, throughput: 312.42 | 2022-04-11 04:09:04.144 [rank:0] [train], epoch: 22/50, iter: 200/834, loss: 0.32140, lr: 0.900526, top1: 0.61167, throughput: 312.58 | 2022-04-11 04:09:04.144 [rank:2] [train], epoch: 22/50, iter: 200/834, loss: 0.32279, lr: 0.900526, top1: 0.61333, throughput: 312.49 | 2022-04-11 04:09:04.151 [rank:7] [train], epoch: 22/50, iter: 200/834, loss: 0.32549, lr: 0.900526, top1: 0.60177, throughput: 313.07 | 2022-04-11 04:09:04.073 [rank:1] [train], epoch: 22/50, iter: 200/834, loss: 0.32172, lr: 0.900526, top1: 0.60969, throughput: 312.86 | 2022-04-11 04:09:04.082 [rank:6] [train], epoch: 22/50, iter: 200/834, loss: 0.32648, lr: 0.900526, top1: 0.60036, throughput: 312.36 | 2022-04-11 04:09:04.197 [rank:1] [train], epoch: 22/50, iter: 300/834, loss: 0.32554, lr: 0.894823, top1: 0.60156, throughput: 312.77 | 2022-04-11 04:10:05.469 [rank:2] [train], epoch: 22/50, iter: 300/834, loss: 0.32532, lr: 0.894823, top1: 0.60219, throughput: 313.11 | 2022-04-11 04:10:05.470 [rank:6] [train], epoch: 22/50, iter: 300/834, loss: 0.32482, lr: 0.894823, top1: 0.60396, throughput: 313.33 | 2022-04-11 04:10:05.473 [rank:3] [train], epoch: 22/50, iter: 300/834, loss: 0.32583, lr: 0.894823, top1: 0.60214, throughput: 312.91 | 2022-04-11 04:10:05.503 [rank:4] [train], epoch: 22/50, iter: 300/834, loss: 0.32480, lr: 0.894823, top1: 0.60182, throughput: 312.63 | 2022-04-11 04:10:05.510 [rank:5] [train], epoch: 22/50, iter: 300/834, loss: 0.32569, lr: 0.894823, top1: 0.60078, throughput: 312.71 | 2022-04-11 04:10:05.517 [rank:0] [train], epoch: 22/50, iter: 300/834, loss: 0.32763, lr: 0.894823, top1: 0.59807, throughput: 312.83 | 2022-04-11 04:10:05.520 [rank:7] [train], epoch: 22/50, iter: 300/834, loss: 0.32568, lr: 0.894823, top1: 0.60589, throughput: 312.33 | 2022-04-11 04:10:05.547 [rank:7] [train], epoch: 22/50, iter: 400/834, loss: 0.32256, lr: 0.889113, top1: 0.60448, throughput: 314.68 | 2022-04-11 04:11:06.562 [rank:6] [train], epoch: 22/50, iter: 400/834, loss: 0.32183, lr: 0.889113, top1: 0.60719, throughput: 314.25 | 2022-04-11 04:11:06.571 [rank:2] [train], epoch: 22/50, iter: 400/834, loss: 0.32471, lr: 0.889113, top1: 0.60172, throughput: 314.19 | 2022-04-11 04:11:06.581 [rank:1] [train], epoch: 22/50, iter: 400/834, loss: 0.32451, lr: 0.889113, top1: 0.59875, throughput: 314.16 | 2022-04-11 04:11:06.585 [rank:0] [train], epoch: 22/50, iter: 400/834, loss: 0.32313, lr: 0.889113, top1: 0.60797, throughput: 314.31 | 2022-04-11 04:11:06.607 [rank:3] [train], epoch: 22/50, iter: 400/834, loss: 0.32458, lr: 0.889113, top1: 0.60115, throughput: 314.21 | 2022-04-11 04:11:06.608 [rank:4] [train], epoch: 22/50, iter: 400/834, loss: 0.32544, lr: 0.889113, top1: 0.59667, throughput: 314.18 | 2022-04-11 04:11:06.622 [rank:5] [train], epoch: 22/50, iter: 400/834, loss: 0.32353, lr: 0.889113, top1: 0.60344, throughput: 314.11 | 2022-04-11 04:11:06.643 [rank:5] [train], epoch: 22/50, iter: 500/834, loss: 0.32305, lr: 0.883396, top1: 0.60839, throughput: 314.66 | 2022-04-11 04:12:07.661 [rank:2] [train], epoch: 22/50, iter: 500/834, loss: 0.32771, lr: 0.883396, top1: 0.59760, throughput: 314.21 | 2022-04-11 04:12:07.686 [rank:7] [train], epoch: 22/50, iter: 500/834, loss: 0.32659, lr: 0.883396, top1: 0.60234, throughput: 314.00 | 2022-04-11 04:12:07.709 [rank:4] [train], epoch: 22/50, iter: 500/834, loss: 0.32585, lr: 0.883396, top1: 0.60443, throughput: 314.29 | 2022-04-11 04:12:07.712 [rank:1] [train], epoch: 22/50, iter: 500/834, loss: 0.32635, lr: 0.883396, top1: 0.59833, throughput: 314.07 | 2022-04-11 04:12:07.718 [rank:0] [train], epoch: 22/50, iter: 500/834, loss: 0.32517, lr: 0.883396, top1: 0.60281, throughput: 314.14 | 2022-04-11 04:12:07.726 [rank:3] [train], epoch: 22/50, iter: 500/834, loss: 0.32693, lr: 0.883396, top1: 0.59844, throughput: 314.07 | 2022-04-11 04:12:07.741 [rank:6] [train], epoch: 22/50, iter: 500/834, loss: 0.32429, lr: 0.883396, top1: 0.60469, throughput: 313.82 | 2022-04-11 04:12:07.752 [rank:6] [train], epoch: 22/50, iter: 600/834, loss: 0.32577, lr: 0.877673, top1: 0.60156, throughput: 313.40 | 2022-04-11 04:13:09.017 [rank:2] [train], epoch: 22/50, iter: 600/834, loss: 0.32586, lr: 0.877673, top1: 0.60109, throughput: 312.83 | 2022-04-11 04:13:09.061 [rank:3] [train], epoch: 22/50, iter: 600/834, loss: 0.32648, lr: 0.877673, top1: 0.59630, throughput: 313.05 | 2022-04-11 04:13:09.074 [rank:5] [train], epoch: 22/50, iter: 600/834, loss: 0.32336, lr: 0.877673, top1: 0.60500, throughput: 312.59 | 2022-04-11 04:13:09.082 [rank:4] [train], epoch: 22/50, iter: 600/834, loss: 0.32465, lr: 0.877673, top1: 0.60734, throughput: 312.76 | 2022-04-11 04:13:09.101 [rank:0] [train], epoch: 22/50, iter: 600/834, loss: 0.32642, lr: 0.877673, top1: 0.60203, throughput: 312.59 | 2022-04-11 04:13:09.149 [rank:7] [train], epoch: 22/50, iter: 600/834, loss: 0.32399, lr: 0.877673, top1: 0.60427, throughput: 312.50 | 2022-04-11 04:13:09.150 [rank:1] [train], epoch: 22/50, iter: 600/834, loss: 0.32603, lr: 0.877673, top1: 0.59979, throughput: 312.82 | 2022-04-11 04:13:09.095 [rank:3] [train], epoch: 22/50, iter: 700/834, loss: 0.32701, lr: 0.871943, top1: 0.60234, throughput: 311.24 | 2022-04-11 04:14:10.762 [rank:4] [train], epoch: 22/50, iter: 700/834, loss: 0.32559, lr: 0.871943, top1: 0.60411, throughput: 311.29 | 2022-04-11 04:14:10.779 [rank:2] [train], epoch: 22/50, iter: 700/834, loss: 0.32459, lr: 0.871943, top1: 0.60328, throughput: 311.02 | 2022-04-11 04:14:10.792 [rank:1] [train], epoch: 22/50, iter: 700/834, loss: 0.32344, lr: 0.871943, top1: 0.60573, throughput: 311.19 | 2022-04-11 04:14:10.793 [rank:0] [train], epoch: 22/50, iter: 700/834, loss: 0.32392, lr: 0.871943, top1: 0.60708, throughput: 311.40 | 2022-04-11 04:14:10.806 [rank:7] [train], epoch: 22/50, iter: 700/834, loss: 0.32817, lr: 0.871943, top1: 0.59589, throughput: 311.41 | 2022-04-11 04:14:10.806 [rank:6] [train], epoch: 22/50, iter: 700/834, loss: 0.32847, lr: 0.871943, top1: 0.59714, throughput: 310.73 | 2022-04-11 04:14:10.806 [rank:5] [train], epoch: 22/50, iter: 700/834, loss: 0.32899, lr: 0.871943, top1: 0.59995, throughput: 310.90 | 2022-04-11 04:14:10.839 [rank:1] [train], epoch: 22/50, iter: 800/834, loss: 0.32301, lr: 0.866207, top1: 0.60984, throughput: 313.30 | 2022-04-11 04:15:12.076 [rank:0] [train], epoch: 22/50, iter: 800/834, loss: 0.32309, lr: 0.866207, top1: 0.60911, throughput: 313.31 | 2022-04-11 04:15:12.086 [rank:2] [train], epoch: 22/50, iter: 800/834, loss: 0.32572, lr: 0.866207, top1: 0.60047, throughput: 313.19 | 2022-04-11 04:15:12.098 [rank:7] [train], epoch: 22/50, iter: 800/834, loss: 0.32640, lr: 0.866207, top1: 0.59979, throughput: 313.10 | 2022-04-11 04:15:12.127 [rank:5] [train], epoch: 22/50, iter: 800/834, loss: 0.32823, lr: 0.866207, top1: 0.59568, throughput: 313.24 | 2022-04-11 04:15:12.135 [rank:3] [train], epoch: 22/50, iter: 800/834, loss: 0.32415, lr: 0.866207, top1: 0.59776, throughput: 312.83 | 2022-04-11 04:15:12.138 [rank:6] [train], epoch: 22/50, iter: 800/834, loss: 0.32496, lr: 0.866207, top1: 0.60422, throughput: 313.04 | 2022-04-11 04:15:12.139 [rank:4] [train], epoch: 22/50, iter: 800/834, loss: 0.32524, lr: 0.866207, top1: 0.59828, throughput: 312.86 | 2022-04-11 04:15:12.148 [rank:6] [train], epoch: 22/50, iter: 834/834, loss: 0.32498, lr: 0.864256, top1: 0.60447, throughput: 312.84 | 2022-04-11 04:15:33.006 [rank:4] [train], epoch: 22/50, iter: 834/834, loss: 0.32258, lr: 0.864256, top1: 0.60677, throughput: 312.17 | 2022-04-11 04:15:33.060 [rank:0] [train], epoch: 22/50, iter: 834/834, loss: 0.32938, lr: 0.864256, top1: 0.59804, throughput: 311.01 | 2022-04-11 04:15:33.076 [rank:5] [train], epoch: 22/50, iter: 834/834, loss: 0.32231, lr: 0.864256, top1: 0.60769, throughput: 311.72 | 2022-04-11 04:15:33.077 [rank:1] [train], epoch: 22/50, iter: 834/834, loss: 0.32447, lr: 0.864256, top1: 0.60600, throughput: 310.71 | 2022-04-11 04:15:33.085 [rank:7] [train], epoch: 22/50, iter: 834/834, loss: 0.32079, lr: 0.864256, top1: 0.61366, throughput: 311.31 | 2022-04-11 04:15:33.096 [rank:2] [train], epoch: 22/50, iter: 834/834, loss: 0.33149, lr: 0.864256, top1: 0.59176, throughput: 310.77 | 2022-04-11 04:15:33.103 [rank:3] [train], epoch: 22/50, iter: 834/834, loss: 0.32764, lr: 0.864256, top1: 0.59804, throughput: 310.61 | 2022-04-11 04:15:33.155 [rank:0] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.61488, throughput: 485.68 | 2022-04-11 04:15:45.944 [rank:2] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.61008, throughput: 486.57 | 2022-04-11 04:15:45.949 [rank:3] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.61024, throughput: 488.24 | 2022-04-11 04:15:45.956 [rank:7] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.61584, throughput: 485.60 | 2022-04-11 04:15:45.967 [rank:1] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.61968, throughput: 485.13 | 2022-04-11 04:15:45.969 [rank:6] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.61584, throughput: 482.07 | 2022-04-11 04:15:45.971 [rank:5] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.59792, throughput: 484.53 | 2022-04-11 04:15:45.976 [rank:4] [eval], epoch: 22/50, iter: 125/125, loss: 0.00000, lr: 0.864256, top1: 0.60896, throughput: 483.30 | 2022-04-11 04:15:45.992 [rank:6] [train], epoch: 23/50, iter: 100/834, loss: 0.32291, lr: 0.858513, top1: 0.60307, throughput: 313.62 | 2022-04-11 04:16:47.191 [rank:4] [train], epoch: 23/50, iter: 100/834, loss: 0.32007, lr: 0.858513, top1: 0.61099, throughput: 313.57 | 2022-04-11 04:16:47.223 [rank:5] [train], epoch: 23/50, iter: 100/834, loss: 0.32090, lr: 0.858513, top1: 0.61089, throughput: 313.48 | 2022-04-11 04:16:47.224 [rank:0] [train], epoch: 23/50, iter: 100/834, loss: 0.32038, lr: 0.858513, top1: 0.61385, throughput: 313.27 | 2022-04-11 04:16:47.234 [rank:3] [train], epoch: 23/50, iter: 100/834, loss: 0.31761, lr: 0.858513, top1: 0.61818, throughput: 313.33 | 2022-04-11 04:16:47.234 [rank:1] [train], epoch: 23/50, iter: 100/834, loss: 0.31543, lr: 0.858513, top1: 0.62281, throughput: 313.32 | 2022-04-11 04:16:47.247 [rank:7] [train], epoch: 23/50, iter: 100/834, loss: 0.31755, lr: 0.858513, top1: 0.61938, throughput: 313.19 | 2022-04-11 04:16:47.272 [rank:2] [train], epoch: 23/50, iter: 100/834, loss: 0.31973, lr: 0.858513, top1: 0.61068, throughput: 313.09 | 2022-04-11 04:16:47.272 [rank:5] [train], epoch: 23/50, iter: 200/834, loss: 0.32229, lr: 0.852765, top1: 0.61042, throughput: 311.81 | 2022-04-11 04:17:48.800 [rank:4] [train], epoch: 23/50, iter: 200/834, loss: 0.32151, lr: 0.852765, top1: 0.60766, throughput: 311.79 | 2022-04-11 04:17:48.803 [rank:3] [train], epoch: 23/50, iter: 200/834, loss: 0.31718, lr: 0.852765, top1: 0.61885, throughput: 311.76 | 2022-04-11 04:17:48.820 [rank:7] [train], epoch: 23/50, iter: 200/834, loss: 0.31806, lr: 0.852765, top1: 0.61635, throughput: 311.82 | 2022-04-11 04:17:48.845 [rank:2] [train], epoch: 23/50, iter: 200/834, loss: 0.31934, lr: 0.852765, top1: 0.61385, throughput: 311.82 | 2022-04-11 04:17:48.846 [rank:0] [train], epoch: 23/50, iter: 200/834, loss: 0.32039, lr: 0.852765, top1: 0.61427, throughput: 311.62 | 2022-04-11 04:17:48.847 [rank:1] [train], epoch: 23/50, iter: 200/834, loss: 0.32254, lr: 0.852765, top1: 0.60896, throughput: 311.63 | 2022-04-11 04:17:48.859 [rank:6] [train], epoch: 23/50, iter: 200/834, loss: 0.31969, lr: 0.852765, top1: 0.61016, throughput: 311.27 | 2022-04-11 04:17:48.875 [rank:4] [train], epoch: 23/50, iter: 300/834, loss: 0.32156, lr: 0.847012, top1: 0.60911, throughput: 313.67 | 2022-04-11 04:18:50.013 [rank:7] [train], epoch: 23/50, iter: 300/834, loss: 0.32303, lr: 0.847012, top1: 0.60266, throughput: 313.81 | 2022-04-11 04:18:50.030 [rank:2] [train], epoch: 23/50, iter: 300/834, loss: 0.32154, lr: 0.847012, top1: 0.60917, throughput: 313.79 | 2022-04-11 04:18:50.033 [rank:5] [train], epoch: 23/50, iter: 300/834, loss: 0.32036, lr: 0.847012, top1: 0.61057, throughput: 313.49 | 2022-04-11 04:18:50.045 [rank:6] [train], epoch: 23/50, iter: 300/834, loss: 0.31988, lr: 0.847012, top1: 0.61156, throughput: 313.81 | 2022-04-11 04:18:50.059 [rank:0] [train], epoch: 23/50, iter: 300/834, loss: 0.32193, lr: 0.847012, top1: 0.60870, throughput: 313.66 | 2022-04-11 04:18:50.060 [rank:3] [train], epoch: 23/50, iter: 300/834, loss: 0.32172, lr: 0.847012, top1: 0.60677, throughput: 313.52 | 2022-04-11 04:18:50.061 [rank:1] [train], epoch: 23/50, iter: 300/834, loss: 0.32246, lr: 0.847012, top1: 0.60740, throughput: 314.04 | 2022-04-11 04:18:49.998 [rank:1] [train], epoch: 23/50, iter: 400/834, loss: 0.32141, lr: 0.841254, top1: 0.60995, throughput: 311.67 | 2022-04-11 04:19:51.600 [rank:7] [train], epoch: 23/50, iter: 400/834, loss: 0.32243, lr: 0.841254, top1: 0.60922, throughput: 311.77 | 2022-04-11 04:19:51.613 [rank:4] [train], epoch: 23/50, iter: 400/834, loss: 0.32086, lr: 0.841254, top1: 0.61031, throughput: 311.67 | 2022-04-11 04:19:51.616 [rank:2] [train], epoch: 23/50, iter: 400/834, loss: 0.32316, lr: 0.841254, top1: 0.60828, throughput: 311.77 | 2022-04-11 04:19:51.616 [rank:6] [train], epoch: 23/50, iter: 400/834, loss: 0.32085, lr: 0.841254, top1: 0.61036, throughput: 311.79 | 2022-04-11 04:19:51.639 [rank:5] [train], epoch: 23/50, iter: 400/834, loss: 0.32009, lr: 0.841254, top1: 0.61328, throughput: 311.67 | 2022-04-11 04:19:51.649 [rank:3] [train], epoch: 23/50, iter: 400/834, loss: 0.32023, lr: 0.841254, top1: 0.61250, throughput: 311.68 | 2022-04-11 04:19:51.663 [rank:0] [train], epoch: 23/50, iter: 400/834, loss: 0.31930, lr: 0.841254, top1: 0.61823, throughput: 311.67 | 2022-04-11 04:19:51.664 [rank:4] [train], epoch: 23/50, iter: 500/834, loss: 0.32230, lr: 0.835493, top1: 0.60286, throughput: 313.47 | 2022-04-11 04:20:52.866 [rank:7] [train], epoch: 23/50, iter: 500/834, loss: 0.32137, lr: 0.835493, top1: 0.60792, throughput: 313.43 | 2022-04-11 04:20:52.870 [rank:6] [train], epoch: 23/50, iter: 500/834, loss: 0.32223, lr: 0.835493, top1: 0.60776, throughput: 313.47 | 2022-04-11 04:20:52.888 [rank:2] [train], epoch: 23/50, iter: 500/834, loss: 0.32521, lr: 0.835493, top1: 0.60125, throughput: 313.30 | 2022-04-11 04:20:52.898 [rank:1] [train], epoch: 23/50, iter: 500/834, loss: 0.32610, lr: 0.835493, top1: 0.60234, throughput: 313.17 | 2022-04-11 04:20:52.910 [rank:0] [train], epoch: 23/50, iter: 500/834, loss: 0.32147, lr: 0.835493, top1: 0.60901, throughput: 313.42 | 2022-04-11 04:20:52.923 [rank:3] [train], epoch: 23/50, iter: 500/834, loss: 0.32049, lr: 0.835493, top1: 0.61062, throughput: 313.41 | 2022-04-11 04:20:52.924 [rank:5] [train], epoch: 23/50, iter: 500/834, loss: 0.32349, lr: 0.835493, top1: 0.60307, throughput: 313.29 | 2022-04-11 04:20:52.934 [rank:4] [train], epoch: 23/50, iter: 600/834, loss: 0.32310, lr: 0.829727, top1: 0.60719, throughput: 314.71 | 2022-04-11 04:21:53.875 [rank:1] [train], epoch: 23/50, iter: 600/834, loss: 0.32203, lr: 0.829727, top1: 0.60786, throughput: 314.88 | 2022-04-11 04:21:53.886 [rank:5] [train], epoch: 23/50, iter: 600/834, loss: 0.32384, lr: 0.829727, top1: 0.60406, throughput: 314.94 | 2022-04-11 04:21:53.899 [rank:0] [train], epoch: 23/50, iter: 600/834, loss: 0.31866, lr: 0.829727, top1: 0.61385, throughput: 314.84 | 2022-04-11 04:21:53.906 [rank:6] [train], epoch: 23/50, iter: 600/834, loss: 0.32076, lr: 0.829727, top1: 0.61021, throughput: 314.58 | 2022-04-11 04:21:53.921 [rank:7] [train], epoch: 23/50, iter: 600/834, loss: 0.32240, lr: 0.829727, top1: 0.60740, throughput: 314.31 | 2022-04-11 04:21:53.956 [rank:3] [train], epoch: 23/50, iter: 600/834, loss: 0.32419, lr: 0.829727, top1: 0.60531, throughput: 314.50 | 2022-04-11 04:21:53.973 [rank:2] [train], epoch: 23/50, iter: 600/834, loss: 0.32290, lr: 0.829727, top1: 0.60240, throughput: 314.78 | 2022-04-11 04:21:53.892 [rank:7] [train], epoch: 23/50, iter: 700/834, loss: 0.32243, lr: 0.823958, top1: 0.61052, throughput: 313.86 | 2022-04-11 04:22:55.131 [rank:3] [train], epoch: 23/50, iter: 700/834, loss: 0.32459, lr: 0.823958, top1: 0.60214, throughput: 313.89 | 2022-04-11 04:22:55.140 [rank:2] [train], epoch: 23/50, iter: 700/834, loss: 0.32281, lr: 0.823958, top1: 0.60656, throughput: 313.44 | 2022-04-11 04:22:55.147 [rank:0] [train], epoch: 23/50, iter: 700/834, loss: 0.32179, lr: 0.823958, top1: 0.60844, throughput: 313.44 | 2022-04-11 04:22:55.162 [rank:5] [train], epoch: 23/50, iter: 700/834, loss: 0.32087, lr: 0.823958, top1: 0.60698, throughput: 313.37 | 2022-04-11 04:22:55.169 [rank:1] [train], epoch: 23/50, iter: 700/834, loss: 0.32214, lr: 0.823958, top1: 0.60807, throughput: 313.23 | 2022-04-11 04:22:55.182 [rank:6] [train], epoch: 23/50, iter: 700/834, loss: 0.32126, lr: 0.823958, top1: 0.61339, throughput: 313.37 | 2022-04-11 04:22:55.190 [rank:4] [train], epoch: 23/50, iter: 700/834, loss: 0.32121, lr: 0.823958, top1: 0.60865, throughput: 313.11 | 2022-04-11 04:22:55.196 [rank:7] [train], epoch: 23/50, iter: 800/834, loss: 0.32520, lr: 0.818186, top1: 0.60469, throughput: 311.69 | 2022-04-11 04:23:56.730 [rank:4] [train], epoch: 23/50, iter: 800/834, loss: 0.31852, lr: 0.818186, top1: 0.61464, throughput: 311.76 | 2022-04-11 04:23:56.781 [rank:1] [train], epoch: 23/50, iter: 800/834, loss: 0.32445, lr: 0.818186, top1: 0.60687, throughput: 311.54 | 2022-04-11 04:23:56.811 [rank:5] [train], epoch: 23/50, iter: 800/834, loss: 0.32120, lr: 0.818186, top1: 0.61125, throughput: 311.44 | 2022-04-11 04:23:56.817 [rank:6] [train], epoch: 23/50, iter: 800/834, loss: 0.32632, lr: 0.818186, top1: 0.60005, throughput: 311.55 | 2022-04-11 04:23:56.818 [rank:0] [train], epoch: 23/50, iter: 800/834, loss: 0.32393, lr: 0.818186, top1: 0.60552, throughput: 311.32 | 2022-04-11 04:23:56.834 [rank:3] [train], epoch: 23/50, iter: 800/834, loss: 0.32373, lr: 0.818186, top1: 0.60391, throughput: 311.06 | 2022-04-11 04:23:56.864 [rank:2] [train], epoch: 23/50, iter: 800/834, loss: 0.32257, lr: 0.818186, top1: 0.60781, throughput: 311.09 | 2022-04-11 04:23:56.866 [rank:2] [train], epoch: 23/50, iter: 834/834, loss: 0.32211, lr: 0.816223, top1: 0.60983, throughput: 313.87 | 2022-04-11 04:24:17.664 [rank:5] [train], epoch: 23/50, iter: 834/834, loss: 0.32288, lr: 0.816223, top1: 0.59896, throughput: 313.09 | 2022-04-11 04:24:17.667 [rank:4] [train], epoch: 23/50, iter: 834/834, loss: 0.31857, lr: 0.816223, top1: 0.61550, throughput: 312.51 | 2022-04-11 04:24:17.670 [rank:0] [train], epoch: 23/50, iter: 834/834, loss: 0.32215, lr: 0.816223, top1: 0.61627, throughput: 313.27 | 2022-04-11 04:24:17.673 [rank:6] [train], epoch: 23/50, iter: 834/834, loss: 0.31843, lr: 0.816223, top1: 0.60723, throughput: 312.96 | 2022-04-11 04:24:17.677 [rank:1] [train], epoch: 23/50, iter: 834/834, loss: 0.31792, lr: 0.816223, top1: 0.61443, throughput: 312.63 | 2022-04-11 04:24:17.691 [rank:7] [train], epoch: 23/50, iter: 834/834, loss: 0.32333, lr: 0.816223, top1: 0.60080, throughput: 311.34 | 2022-04-11 04:24:17.697 [rank:3] [train], epoch: 23/50, iter: 834/834, loss: 0.32515, lr: 0.816223, top1: 0.60937, throughput: 313.32 | 2022-04-11 04:24:17.699 [rank:2] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.61248, throughput: 485.79 | 2022-04-11 04:24:30.530 [rank:0] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.62688, throughput: 486.07 | 2022-04-11 04:24:30.531 [rank:1] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.61920, throughput: 486.36 | 2022-04-11 04:24:30.542 [rank:7] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.61216, throughput: 486.56 | 2022-04-11 04:24:30.543 [rank:5] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.60608, throughput: 485.06 | 2022-04-11 04:24:30.552 [rank:3] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.61440, throughput: 486.04 | 2022-04-11 04:24:30.558 [rank:6] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.61792, throughput: 485.13 | 2022-04-11 04:24:30.560 [rank:4] [eval], epoch: 23/50, iter: 125/125, loss: 0.00000, lr: 0.816223, top1: 0.61744, throughput: 484.48 | 2022-04-11 04:24:30.570 [rank:1] [train], epoch: 24/50, iter: 100/834, loss: 0.31600, lr: 0.810447, top1: 0.62120, throughput: 312.74 | 2022-04-11 04:25:31.934 [rank:0] [train], epoch: 24/50, iter: 100/834, loss: 0.31642, lr: 0.810447, top1: 0.61969, throughput: 312.55 | 2022-04-11 04:25:31.961 [rank:4] [train], epoch: 24/50, iter: 100/834, loss: 0.31597, lr: 0.810447, top1: 0.62115, throughput: 312.69 | 2022-04-11 04:25:31.973 [rank:7] [train], epoch: 24/50, iter: 100/834, loss: 0.31760, lr: 0.810447, top1: 0.61500, throughput: 312.53 | 2022-04-11 04:25:31.977 [rank:3] [train], epoch: 24/50, iter: 100/834, loss: 0.31828, lr: 0.810447, top1: 0.61479, throughput: 312.56 | 2022-04-11 04:25:31.986 [rank:5] [train], epoch: 24/50, iter: 100/834, loss: 0.31765, lr: 0.810447, top1: 0.61589, throughput: 312.54 | 2022-04-11 04:25:31.985 [rank:2] [train], epoch: 24/50, iter: 100/834, loss: 0.31733, lr: 0.810447, top1: 0.61745, throughput: 312.38 | 2022-04-11 04:25:31.993 [rank:6] [train], epoch: 24/50, iter: 100/834, loss: 0.31432, lr: 0.810447, top1: 0.62427, throughput: 312.89 | 2022-04-11 04:25:31.922 [rank:5] [train], epoch: 24/50, iter: 200/834, loss: 0.31882, lr: 0.804669, top1: 0.61255, throughput: 312.08 | 2022-04-11 04:26:33.508 [rank:7] [train], epoch: 24/50, iter: 200/834, loss: 0.31925, lr: 0.804669, top1: 0.61323, throughput: 311.96 | 2022-04-11 04:26:33.523 [rank:2] [train], epoch: 24/50, iter: 200/834, loss: 0.31622, lr: 0.804669, top1: 0.61682, throughput: 312.03 | 2022-04-11 04:26:33.526 [rank:4] [train], epoch: 24/50, iter: 200/834, loss: 0.31732, lr: 0.804669, top1: 0.61620, throughput: 311.91 | 2022-04-11 04:26:33.529 [rank:3] [train], epoch: 24/50, iter: 200/834, loss: 0.31800, lr: 0.804669, top1: 0.61302, throughput: 311.92 | 2022-04-11 04:26:33.541 [rank:1] [train], epoch: 24/50, iter: 200/834, loss: 0.31837, lr: 0.804669, top1: 0.61656, throughput: 311.64 | 2022-04-11 04:26:33.543 [rank:6] [train], epoch: 24/50, iter: 200/834, loss: 0.31852, lr: 0.804669, top1: 0.61073, throughput: 311.55 | 2022-04-11 04:26:33.549 [rank:0] [train], epoch: 24/50, iter: 200/834, loss: 0.31864, lr: 0.804669, top1: 0.61661, throughput: 311.67 | 2022-04-11 04:26:33.564 [rank:0] [train], epoch: 24/50, iter: 300/834, loss: 0.31811, lr: 0.798889, top1: 0.61406, throughput: 312.46 | 2022-04-11 04:27:35.012 [rank:6] [train], epoch: 24/50, iter: 300/834, loss: 0.31698, lr: 0.798889, top1: 0.62182, throughput: 312.31 | 2022-04-11 04:27:35.026 [rank:2] [train], epoch: 24/50, iter: 300/834, loss: 0.32114, lr: 0.798889, top1: 0.60906, throughput: 312.14 | 2022-04-11 04:27:35.037 [rank:4] [train], epoch: 24/50, iter: 300/834, loss: 0.31880, lr: 0.798889, top1: 0.61359, throughput: 312.12 | 2022-04-11 04:27:35.044 [rank:5] [train], epoch: 24/50, iter: 300/834, loss: 0.32087, lr: 0.798889, top1: 0.60917, throughput: 312.01 | 2022-04-11 04:27:35.044 [rank:1] [train], epoch: 24/50, iter: 300/834, loss: 0.31683, lr: 0.798889, top1: 0.62135, throughput: 312.11 | 2022-04-11 04:27:35.060 [rank:7] [train], epoch: 24/50, iter: 300/834, loss: 0.31667, lr: 0.798889, top1: 0.61703, throughput: 311.97 | 2022-04-11 04:27:35.067 [rank:3] [train], epoch: 24/50, iter: 300/834, loss: 0.31751, lr: 0.798889, top1: 0.61755, throughput: 312.06 | 2022-04-11 04:27:35.068 [rank:1] [train], epoch: 24/50, iter: 400/834, loss: 0.32052, lr: 0.793107, top1: 0.61146, throughput: 314.13 | 2022-04-11 04:28:36.182 [rank:0] [train], epoch: 24/50, iter: 400/834, loss: 0.31786, lr: 0.793107, top1: 0.61536, throughput: 313.88 | 2022-04-11 04:28:36.183 [rank:7] [train], epoch: 24/50, iter: 400/834, loss: 0.32067, lr: 0.793107, top1: 0.61161, throughput: 314.15 | 2022-04-11 04:28:36.184 [rank:6] [train], epoch: 24/50, iter: 400/834, loss: 0.31879, lr: 0.793107, top1: 0.61443, throughput: 313.92 | 2022-04-11 04:28:36.189 [rank:2] [train], epoch: 24/50, iter: 400/834, loss: 0.31660, lr: 0.793107, top1: 0.61724, throughput: 313.97 | 2022-04-11 04:28:36.189 [rank:4] [train], epoch: 24/50, iter: 400/834, loss: 0.32078, lr: 0.793107, top1: 0.61208, throughput: 313.94 | 2022-04-11 04:28:36.203 [rank:5] [train], epoch: 24/50, iter: 400/834, loss: 0.31785, lr: 0.793107, top1: 0.61771, throughput: 313.93 | 2022-04-11 04:28:36.204 [rank:3] [train], epoch: 24/50, iter: 400/834, loss: 0.31608, lr: 0.793107, top1: 0.62005, throughput: 314.00 | 2022-04-11 04:28:36.215 [rank:2] [train], epoch: 24/50, iter: 500/834, loss: 0.32382, lr: 0.787323, top1: 0.60479, throughput: 314.71 | 2022-04-11 04:29:37.197 [rank:4] [train], epoch: 24/50, iter: 500/834, loss: 0.31804, lr: 0.787323, top1: 0.61490, throughput: 314.70 | 2022-04-11 04:29:37.213 [rank:7] [train], epoch: 24/50, iter: 500/834, loss: 0.31962, lr: 0.787323, top1: 0.61385, throughput: 314.41 | 2022-04-11 04:29:37.251 [rank:6] [train], epoch: 24/50, iter: 500/834, loss: 0.31866, lr: 0.787323, top1: 0.61417, throughput: 314.40 | 2022-04-11 04:29:37.257 [rank:0] [train], epoch: 24/50, iter: 500/834, loss: 0.31924, lr: 0.787323, top1: 0.61047, throughput: 314.35 | 2022-04-11 04:29:37.262 [rank:3] [train], epoch: 24/50, iter: 500/834, loss: 0.31870, lr: 0.787323, top1: 0.61406, throughput: 314.45 | 2022-04-11 04:29:37.274 [rank:1] [train], epoch: 24/50, iter: 500/834, loss: 0.31713, lr: 0.787323, top1: 0.61604, throughput: 314.18 | 2022-04-11 04:29:37.294 [rank:5] [train], epoch: 24/50, iter: 500/834, loss: 0.31814, lr: 0.787323, top1: 0.61312, throughput: 314.22 | 2022-04-11 04:29:37.309 [rank:0] [train], epoch: 24/50, iter: 600/834, loss: 0.31934, lr: 0.781538, top1: 0.61208, throughput: 313.67 | 2022-04-11 04:30:38.473 [rank:5] [train], epoch: 24/50, iter: 600/834, loss: 0.32138, lr: 0.781538, top1: 0.60661, throughput: 313.78 | 2022-04-11 04:30:38.499 [rank:7] [train], epoch: 24/50, iter: 600/834, loss: 0.31805, lr: 0.781538, top1: 0.61047, throughput: 313.48 | 2022-04-11 04:30:38.500 [rank:3] [train], epoch: 24/50, iter: 600/834, loss: 0.32028, lr: 0.781538, top1: 0.61141, throughput: 313.56 | 2022-04-11 04:30:38.506 [rank:2] [train], epoch: 24/50, iter: 600/834, loss: 0.32155, lr: 0.781538, top1: 0.60781, throughput: 313.16 | 2022-04-11 04:30:38.508 [rank:4] [train], epoch: 24/50, iter: 600/834, loss: 0.32119, lr: 0.781538, top1: 0.61271, throughput: 313.23 | 2022-04-11 04:30:38.510 [rank:6] [train], epoch: 24/50, iter: 600/834, loss: 0.31734, lr: 0.781538, top1: 0.61187, throughput: 313.42 | 2022-04-11 04:30:38.517 [rank:1] [train], epoch: 24/50, iter: 600/834, loss: 0.31843, lr: 0.781538, top1: 0.61901, throughput: 313.56 | 2022-04-11 04:30:38.527 [rank:6] [train], epoch: 24/50, iter: 700/834, loss: 0.32123, lr: 0.775753, top1: 0.61120, throughput: 313.80 | 2022-04-11 04:31:39.702 [rank:1] [train], epoch: 24/50, iter: 700/834, loss: 0.31914, lr: 0.775753, top1: 0.61547, throughput: 313.75 | 2022-04-11 04:31:39.721 [rank:5] [train], epoch: 24/50, iter: 700/834, loss: 0.31920, lr: 0.775753, top1: 0.61115, throughput: 313.56 | 2022-04-11 04:31:39.732 [rank:4] [train], epoch: 24/50, iter: 700/834, loss: 0.31831, lr: 0.775753, top1: 0.61578, throughput: 313.60 | 2022-04-11 04:31:39.735 [rank:0] [train], epoch: 24/50, iter: 700/834, loss: 0.31822, lr: 0.775753, top1: 0.61776, throughput: 313.27 | 2022-04-11 04:31:39.762 [rank:2] [train], epoch: 24/50, iter: 700/834, loss: 0.31967, lr: 0.775753, top1: 0.61047, throughput: 313.84 | 2022-04-11 04:31:39.685 [rank:3] [train], epoch: 24/50, iter: 700/834, loss: 0.31886, lr: 0.775753, top1: 0.60964, throughput: 313.34 | 2022-04-11 04:31:39.782 [rank:7] [train], epoch: 24/50, iter: 700/834, loss: 0.31832, lr: 0.775753, top1: 0.61594, throughput: 313.24 | 2022-04-11 04:31:39.794 [rank:2] [train], epoch: 24/50, iter: 800/834, loss: 0.31929, lr: 0.769967, top1: 0.60766, throughput: 312.13 | 2022-04-11 04:32:41.197 [rank:0] [train], epoch: 24/50, iter: 800/834, loss: 0.32089, lr: 0.769967, top1: 0.60474, throughput: 312.41 | 2022-04-11 04:32:41.219 [rank:1] [train], epoch: 24/50, iter: 800/834, loss: 0.32125, lr: 0.769967, top1: 0.61094, throughput: 312.19 | 2022-04-11 04:32:41.223 [rank:5] [train], epoch: 24/50, iter: 800/834, loss: 0.31728, lr: 0.769967, top1: 0.61599, throughput: 312.24 | 2022-04-11 04:32:41.224 [rank:6] [train], epoch: 24/50, iter: 800/834, loss: 0.32167, lr: 0.769967, top1: 0.60323, throughput: 312.03 | 2022-04-11 04:32:41.236 [rank:3] [train], epoch: 24/50, iter: 800/834, loss: 0.31900, lr: 0.769967, top1: 0.61432, throughput: 312.32 | 2022-04-11 04:32:41.256 [rank:7] [train], epoch: 24/50, iter: 800/834, loss: 0.31861, lr: 0.769967, top1: 0.61719, throughput: 312.38 | 2022-04-11 04:32:41.257 [rank:4] [train], epoch: 24/50, iter: 800/834, loss: 0.31985, lr: 0.769967, top1: 0.61313, throughput: 312.05 | 2022-04-11 04:32:41.263 [rank:5] [train], epoch: 24/50, iter: 834/834, loss: 0.31838, lr: 0.768000, top1: 0.61397, throughput: 312.79 | 2022-04-11 04:33:02.094 [rank:0] [train], epoch: 24/50, iter: 834/834, loss: 0.32118, lr: 0.768000, top1: 0.60983, throughput: 312.63 | 2022-04-11 04:33:02.100 [rank:2] [train], epoch: 24/50, iter: 834/834, loss: 0.32319, lr: 0.768000, top1: 0.61780, throughput: 312.15 | 2022-04-11 04:33:02.110 [rank:1] [train], epoch: 24/50, iter: 834/834, loss: 0.32061, lr: 0.768000, top1: 0.61320, throughput: 312.47 | 2022-04-11 04:33:02.114 [rank:4] [train], epoch: 24/50, iter: 834/834, loss: 0.32026, lr: 0.768000, top1: 0.61259, throughput: 313.04 | 2022-04-11 04:33:02.117 [rank:7] [train], epoch: 24/50, iter: 834/834, loss: 0.31962, lr: 0.768000, top1: 0.60922, throughput: 312.88 | 2022-04-11 04:33:02.122 [rank:6] [train], epoch: 24/50, iter: 834/834, loss: 0.31639, lr: 0.768000, top1: 0.61749, throughput: 312.11 | 2022-04-11 04:33:02.151 [rank:3] [train], epoch: 24/50, iter: 834/834, loss: 0.32086, lr: 0.768000, top1: 0.60800, throughput: 312.32 | 2022-04-11 04:33:02.158 [rank:0] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.63552, throughput: 481.91 | 2022-04-11 04:33:15.069 [rank:2] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.62768, throughput: 482.20 | 2022-04-11 04:33:15.072 [rank:7] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.62880, throughput: 482.10 | 2022-04-11 04:33:15.086 [rank:6] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.63424, throughput: 483.00 | 2022-04-11 04:33:15.091 [rank:3] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.61968, throughput: 482.89 | 2022-04-11 04:33:15.101 [rank:4] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.63072, throughput: 481.21 | 2022-04-11 04:33:15.105 [rank:1] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.63520, throughput: 481.08 | 2022-04-11 04:33:15.106 [rank:5] [eval], epoch: 24/50, iter: 125/125, loss: 0.00000, lr: 0.768000, top1: 0.61616, throughput: 480.25 | 2022-04-11 04:33:15.108 [rank:6] [train], epoch: 25/50, iter: 100/834, loss: 0.31535, lr: 0.762214, top1: 0.62266, throughput: 314.26 | 2022-04-11 04:34:16.186 [rank:0] [train], epoch: 25/50, iter: 100/834, loss: 0.31270, lr: 0.762214, top1: 0.62349, throughput: 314.08 | 2022-04-11 04:34:16.200 [rank:4] [train], epoch: 25/50, iter: 100/834, loss: 0.31300, lr: 0.762214, top1: 0.62802, throughput: 314.14 | 2022-04-11 04:34:16.225 [rank:7] [train], epoch: 25/50, iter: 100/834, loss: 0.31231, lr: 0.762214, top1: 0.63068, throughput: 313.96 | 2022-04-11 04:34:16.241 [rank:1] [train], epoch: 25/50, iter: 100/834, loss: 0.30971, lr: 0.762214, top1: 0.63391, throughput: 313.97 | 2022-04-11 04:34:16.258 [rank:2] [train], epoch: 25/50, iter: 100/834, loss: 0.31552, lr: 0.762214, top1: 0.62078, throughput: 313.76 | 2022-04-11 04:34:16.264 [rank:5] [train], epoch: 25/50, iter: 100/834, loss: 0.31205, lr: 0.762214, top1: 0.62609, throughput: 313.86 | 2022-04-11 04:34:16.281 [rank:3] [train], epoch: 25/50, iter: 100/834, loss: 0.31345, lr: 0.762214, top1: 0.62536, throughput: 313.81 | 2022-04-11 04:34:16.284 [rank:0] [train], epoch: 25/50, iter: 200/834, loss: 0.31273, lr: 0.756429, top1: 0.62922, throughput: 312.34 | 2022-04-11 04:35:17.673 [rank:7] [train], epoch: 25/50, iter: 200/834, loss: 0.31310, lr: 0.756429, top1: 0.62286, throughput: 312.49 | 2022-04-11 04:35:17.683 [rank:6] [train], epoch: 25/50, iter: 200/834, loss: 0.31291, lr: 0.756429, top1: 0.62552, throughput: 312.17 | 2022-04-11 04:35:17.692 [rank:1] [train], epoch: 25/50, iter: 200/834, loss: 0.31543, lr: 0.756429, top1: 0.62260, throughput: 312.50 | 2022-04-11 04:35:17.699 [rank:5] [train], epoch: 25/50, iter: 200/834, loss: 0.31577, lr: 0.756429, top1: 0.61599, throughput: 312.60 | 2022-04-11 04:35:17.701 [rank:3] [train], epoch: 25/50, iter: 200/834, loss: 0.31337, lr: 0.756429, top1: 0.62870, throughput: 312.53 | 2022-04-11 04:35:17.718 [rank:2] [train], epoch: 25/50, iter: 200/834, loss: 0.31374, lr: 0.756429, top1: 0.62432, throughput: 312.41 | 2022-04-11 04:35:17.722 [rank:4] [train], epoch: 25/50, iter: 200/834, loss: 0.31206, lr: 0.756429, top1: 0.62557, throughput: 312.21 | 2022-04-11 04:35:17.722 [rank:2] [train], epoch: 25/50, iter: 300/834, loss: 0.31667, lr: 0.750644, top1: 0.61818, throughput: 314.04 | 2022-04-11 04:36:18.861 [rank:0] [train], epoch: 25/50, iter: 300/834, loss: 0.31393, lr: 0.750644, top1: 0.62146, throughput: 313.68 | 2022-04-11 04:36:18.882 [rank:7] [train], epoch: 25/50, iter: 300/834, loss: 0.31682, lr: 0.750644, top1: 0.61453, throughput: 313.72 | 2022-04-11 04:36:18.884 [rank:4] [train], epoch: 25/50, iter: 300/834, loss: 0.31656, lr: 0.750644, top1: 0.61870, throughput: 313.74 | 2022-04-11 04:36:18.919 [rank:5] [train], epoch: 25/50, iter: 300/834, loss: 0.31627, lr: 0.750644, top1: 0.61964, throughput: 313.56 | 2022-04-11 04:36:18.933 [rank:1] [train], epoch: 25/50, iter: 300/834, loss: 0.31401, lr: 0.750644, top1: 0.62286, throughput: 313.51 | 2022-04-11 04:36:18.940 [rank:6] [train], epoch: 25/50, iter: 300/834, loss: 0.31417, lr: 0.750644, top1: 0.62182, throughput: 313.85 | 2022-04-11 04:36:18.868 [rank:3] [train], epoch: 25/50, iter: 300/834, loss: 0.31269, lr: 0.750644, top1: 0.62750, throughput: 313.50 | 2022-04-11 04:36:18.963 [rank:2] [train], epoch: 25/50, iter: 400/834, loss: 0.31325, lr: 0.744860, top1: 0.61995, throughput: 311.85 | 2022-04-11 04:37:20.428 [rank:5] [train], epoch: 25/50, iter: 400/834, loss: 0.31717, lr: 0.744860, top1: 0.61615, throughput: 312.19 | 2022-04-11 04:37:20.433 [rank:0] [train], epoch: 25/50, iter: 400/834, loss: 0.31607, lr: 0.744860, top1: 0.61714, throughput: 311.89 | 2022-04-11 04:37:20.442 [rank:1] [train], epoch: 25/50, iter: 400/834, loss: 0.31942, lr: 0.744860, top1: 0.61443, throughput: 311.97 | 2022-04-11 04:37:20.485 [rank:7] [train], epoch: 25/50, iter: 400/834, loss: 0.31649, lr: 0.744860, top1: 0.61911, throughput: 311.98 | 2022-04-11 04:37:20.426 [rank:3] [train], epoch: 25/50, iter: 400/834, loss: 0.31667, lr: 0.744860, top1: 0.61859, throughput: 312.47 | 2022-04-11 04:37:20.410 [rank:4] [train], epoch: 25/50, iter: 400/834, loss: 0.31785, lr: 0.744860, top1: 0.61510, throughput: 311.83 | 2022-04-11 04:37:20.491 [rank:6] [train], epoch: 25/50, iter: 400/834, loss: 0.31769, lr: 0.744860, top1: 0.61635, throughput: 311.47 | 2022-04-11 04:37:20.512 [rank:5] [train], epoch: 25/50, iter: 500/834, loss: 0.31754, lr: 0.739077, top1: 0.61896, throughput: 312.91 | 2022-04-11 04:38:21.792 [rank:4] [train], epoch: 25/50, iter: 500/834, loss: 0.31789, lr: 0.739077, top1: 0.61422, throughput: 313.17 | 2022-04-11 04:38:21.798 [rank:3] [train], epoch: 25/50, iter: 500/834, loss: 0.31596, lr: 0.739077, top1: 0.61531, throughput: 312.73 | 2022-04-11 04:38:21.804 [rank:1] [train], epoch: 25/50, iter: 500/834, loss: 0.31579, lr: 0.739077, top1: 0.61896, throughput: 312.99 | 2022-04-11 04:38:21.828 [rank:0] [train], epoch: 25/50, iter: 500/834, loss: 0.31874, lr: 0.739077, top1: 0.61276, throughput: 312.74 | 2022-04-11 04:38:21.835 [rank:7] [train], epoch: 25/50, iter: 500/834, loss: 0.31584, lr: 0.739077, top1: 0.61760, throughput: 312.62 | 2022-04-11 04:38:21.843 [rank:2] [train], epoch: 25/50, iter: 500/834, loss: 0.31682, lr: 0.739077, top1: 0.61990, throughput: 312.59 | 2022-04-11 04:38:21.851 [rank:6] [train], epoch: 25/50, iter: 500/834, loss: 0.31525, lr: 0.739077, top1: 0.62354, throughput: 312.91 | 2022-04-11 04:38:21.871 [rank:0] [train], epoch: 25/50, iter: 600/834, loss: 0.31741, lr: 0.733296, top1: 0.61802, throughput: 313.86 | 2022-04-11 04:39:23.010 [rank:5] [train], epoch: 25/50, iter: 600/834, loss: 0.31410, lr: 0.733296, top1: 0.62177, throughput: 313.55 | 2022-04-11 04:39:23.026 [rank:7] [train], epoch: 25/50, iter: 600/834, loss: 0.31680, lr: 0.733296, top1: 0.61557, throughput: 313.76 | 2022-04-11 04:39:23.037 [rank:4] [train], epoch: 25/50, iter: 600/834, loss: 0.31569, lr: 0.733296, top1: 0.62214, throughput: 313.49 | 2022-04-11 04:39:23.045 [rank:6] [train], epoch: 25/50, iter: 600/834, loss: 0.31698, lr: 0.733296, top1: 0.61437, throughput: 313.72 | 2022-04-11 04:39:23.072 [rank:3] [train], epoch: 25/50, iter: 600/834, loss: 0.31566, lr: 0.733296, top1: 0.61714, throughput: 313.37 | 2022-04-11 04:39:23.074 [rank:1] [train], epoch: 25/50, iter: 600/834, loss: 0.31557, lr: 0.733296, top1: 0.61880, throughput: 313.39 | 2022-04-11 04:39:23.093 [rank:2] [train], epoch: 25/50, iter: 600/834, loss: 0.31576, lr: 0.733296, top1: 0.61792, throughput: 313.48 | 2022-04-11 04:39:23.099 [rank:5] [train], epoch: 25/50, iter: 700/834, loss: 0.31754, lr: 0.727517, top1: 0.61526, throughput: 312.56 | 2022-04-11 04:40:24.455 [rank:4] [train], epoch: 25/50, iter: 700/834, loss: 0.31745, lr: 0.727517, top1: 0.61891, throughput: 312.61 | 2022-04-11 04:40:24.463 [rank:0] [train], epoch: 25/50, iter: 700/834, loss: 0.31712, lr: 0.727517, top1: 0.61401, throughput: 312.41 | 2022-04-11 04:40:24.467 [rank:3] [train], epoch: 25/50, iter: 700/834, loss: 0.31778, lr: 0.727517, top1: 0.61979, throughput: 312.69 | 2022-04-11 04:40:24.477 [rank:6] [train], epoch: 25/50, iter: 700/834, loss: 0.31522, lr: 0.727517, top1: 0.61865, throughput: 312.53 | 2022-04-11 04:40:24.506 [rank:2] [train], epoch: 25/50, iter: 700/834, loss: 0.31721, lr: 0.727517, top1: 0.61859, throughput: 312.64 | 2022-04-11 04:40:24.511 [rank:7] [train], epoch: 25/50, iter: 700/834, loss: 0.31947, lr: 0.727517, top1: 0.61453, throughput: 312.30 | 2022-04-11 04:40:24.516 [rank:1] [train], epoch: 25/50, iter: 700/834, loss: 0.31540, lr: 0.727517, top1: 0.62104, throughput: 312.54 | 2022-04-11 04:40:24.525 [rank:1] [train], epoch: 25/50, iter: 800/834, loss: 0.31636, lr: 0.721740, top1: 0.61672, throughput: 314.58 | 2022-04-11 04:41:25.559 [rank:5] [train], epoch: 25/50, iter: 800/834, loss: 0.31474, lr: 0.721740, top1: 0.61724, throughput: 314.22 | 2022-04-11 04:41:25.559 [rank:4] [train], epoch: 25/50, iter: 800/834, loss: 0.31572, lr: 0.721740, top1: 0.61682, throughput: 314.24 | 2022-04-11 04:41:25.564 [rank:0] [train], epoch: 25/50, iter: 800/834, loss: 0.31861, lr: 0.721740, top1: 0.60948, throughput: 314.17 | 2022-04-11 04:41:25.581 [rank:2] [train], epoch: 25/50, iter: 800/834, loss: 0.31862, lr: 0.721740, top1: 0.61286, throughput: 314.30 | 2022-04-11 04:41:25.599 [rank:7] [train], epoch: 25/50, iter: 800/834, loss: 0.31764, lr: 0.721740, top1: 0.61682, throughput: 314.32 | 2022-04-11 04:41:25.600 [rank:6] [train], epoch: 25/50, iter: 800/834, loss: 0.31607, lr: 0.721740, top1: 0.61698, throughput: 314.27 | 2022-04-11 04:41:25.601 [rank:3] [train], epoch: 25/50, iter: 800/834, loss: 0.31579, lr: 0.721740, top1: 0.61854, throughput: 314.49 | 2022-04-11 04:41:25.527 [rank:5] [train], epoch: 25/50, iter: 834/834, loss: 0.31525, lr: 0.719777, top1: 0.62301, throughput: 312.00 | 2022-04-11 04:41:46.482 [rank:4] [train], epoch: 25/50, iter: 834/834, loss: 0.31430, lr: 0.719777, top1: 0.62331, throughput: 312.05 | 2022-04-11 04:41:46.483 [rank:1] [train], epoch: 25/50, iter: 834/834, loss: 0.31801, lr: 0.719777, top1: 0.61259, throughput: 311.84 | 2022-04-11 04:41:46.492 [rank:6] [train], epoch: 25/50, iter: 834/834, loss: 0.31684, lr: 0.719777, top1: 0.61550, throughput: 312.44 | 2022-04-11 04:41:46.494 [rank:3] [train], epoch: 25/50, iter: 834/834, loss: 0.31793, lr: 0.719777, top1: 0.61673, throughput: 311.34[rank:7] [train], epoch: 25/50, iter: 834/834, loss: 0.31509, lr: 0.719777, top1: 0.61749, throughput: 312.41 | 2022-04-11 04:41:46.496 | 2022-04-11 04:41:46.495 [rank:0] [train], epoch: 25/50, iter: 834/834, loss: 0.31146, lr: 0.719777, top1: 0.62393, throughput: 312.09 | 2022-04-11 04:41:46.498 [rank:2] [train], epoch: 25/50, iter: 834/834, loss: 0.31461, lr: 0.719777, top1: 0.62224, throughput: 311.87 | 2022-04-11 04:41:46.530 [rank:0] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.65072, throughput: 488.48 | 2022-04-11 04:41:59.293 [rank:2] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.62896, throughput: 489.49 | 2022-04-11 04:41:59.299 [rank:1] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.64784, throughput: 487.95 | 2022-04-11 04:41:59.301 [rank:6] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.64384, throughput: 487.75 | 2022-04-11 04:41:59.308 [rank:3] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.63648, throughput: 487.70 | 2022-04-11 04:41:59.310 [rank:7] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.64416, throughput: 487.63 | 2022-04-11 04:41:59.313 [rank:4] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.62960, throughput: 487.17 | 2022-04-11 04:41:59.313 [rank:5] [eval], epoch: 25/50, iter: 125/125, loss: 0.00000, lr: 0.719777, top1: 0.62928, throughput: 485.74 | 2022-04-11 04:41:59.349 [rank:2] [train], epoch: 26/50, iter: 100/834, loss: 0.31253, lr: 0.714004, top1: 0.62641, throughput: 313.14 | 2022-04-11 04:43:00.613 [rank:6] [train], epoch: 26/50, iter: 100/834, loss: 0.31486, lr: 0.714004, top1: 0.62031, throughput: 313.12 | 2022-04-11 04:43:00.626 [rank:4] [train], epoch: 26/50, iter: 100/834, loss: 0.31050, lr: 0.714004, top1: 0.62865, throughput: 313.05 | 2022-04-11 04:43:00.644 [rank:3] [train], epoch: 26/50, iter: 100/834, loss: 0.31026, lr: 0.714004, top1: 0.63370, throughput: 312.97 | 2022-04-11 04:43:00.658 [rank:0] [train], epoch: 26/50, iter: 100/834, loss: 0.30753, lr: 0.714004, top1: 0.63781, throughput: 312.87 | 2022-04-11 04:43:00.660 [rank:1] [train], epoch: 26/50, iter: 100/834, loss: 0.31149, lr: 0.714004, top1: 0.62802, throughput: 312.90 | 2022-04-11 04:43:00.663 [rank:7] [train], epoch: 26/50, iter: 100/834, loss: 0.30969, lr: 0.714004, top1: 0.63339, throughput: 312.95 | 2022-04-11 04:43:00.664 [rank:5] [train], epoch: 26/50, iter: 100/834, loss: 0.30928, lr: 0.714004, top1: 0.63240, throughput: 313.07 | 2022-04-11 04:43:00.677 [rank:2] [train], epoch: 26/50, iter: 200/834, loss: 0.31107, lr: 0.708234, top1: 0.63083, throughput: 313.70 | 2022-04-11 04:44:01.817 [rank:3] [train], epoch: 26/50, iter: 200/834, loss: 0.31055, lr: 0.708234, top1: 0.62964, throughput: 313.75 | 2022-04-11 04:44:01.853 [rank:7] [train], epoch: 26/50, iter: 200/834, loss: 0.30939, lr: 0.708234, top1: 0.63135, throughput: 313.77[rank:4] [train], epoch: 26/50, iter: 200/834, loss: 0.31271, lr: 0.708234, top1: 0.62943, throughput: 313.66 | 2022-04-11 04:44:01.856 | 2022-04-11 04:44:01.856 [rank:6] [train], epoch: 26/50, iter: 200/834, loss: 0.31063, lr: 0.708234, top1: 0.63146, throughput: 313.57 | 2022-04-11 04:44:01.857 [rank:1] [train], epoch: 26/50, iter: 200/834, loss: 0.31103, lr: 0.708234, top1: 0.62823, throughput: 313.75 | 2022-04-11 04:44:01.858 [rank:5] [train], epoch: 26/50, iter: 200/834, loss: 0.31339, lr: 0.708234, top1: 0.62547, throughput: 313.82 | 2022-04-11 04:44:01.859 [rank:0] [train], epoch: 26/50, iter: 200/834, loss: 0.31046, lr: 0.708234, top1: 0.63229, throughput: 313.72 | 2022-04-11 04:44:01.862 [rank:4] [train], epoch: 26/50, iter: 300/834, loss: 0.31409, lr: 0.702467, top1: 0.62536, throughput: 312.25 | 2022-04-11 04:45:03.345 [rank:6] [train], epoch: 26/50, iter: 300/834, loss: 0.31234, lr: 0.702467, top1: 0.62521, throughput: 312.05 | 2022-04-11 04:45:03.386 [rank:5] [train], epoch: 26/50, iter: 300/834, loss: 0.30844, lr: 0.702467, top1: 0.63302, throughput: 312.00 | 2022-04-11 04:45:03.398 [rank:2] [train], epoch: 26/50, iter: 300/834, loss: 0.31118, lr: 0.702467, top1: 0.63031, throughput: 311.76 | 2022-04-11 04:45:03.403 [rank:3] [train], epoch: 26/50, iter: 300/834, loss: 0.31389, lr: 0.702467, top1: 0.62448, throughput: 311.70 | 2022-04-11 04:45:03.450 [rank:7] [train], epoch: 26/50, iter: 300/834, loss: 0.31256, lr: 0.702467, top1: 0.62542, throughput: 311.66 | 2022-04-11 04:45:03.461 [rank:0] [train], epoch: 26/50, iter: 300/834, loss: 0.31293, lr: 0.702467, top1: 0.62370, throughput: 311.61 | 2022-04-11 04:45:03.478 [rank:1] [train], epoch: 26/50, iter: 300/834, loss: 0.31318, lr: 0.702467, top1: 0.62687, throughput: 311.98 | 2022-04-11 04:45:03.400 [rank:4] [train], epoch: 26/50, iter: 400/834, loss: 0.31369, lr: 0.696704, top1: 0.62422, throughput: 313.56 | 2022-04-11 04:46:04.577 [rank:2] [train], epoch: 26/50, iter: 400/834, loss: 0.31282, lr: 0.696704, top1: 0.62427, throughput: 313.80 | 2022-04-11 04:46:04.589 [rank:5] [train], epoch: 26/50, iter: 400/834, loss: 0.31603, lr: 0.696704, top1: 0.62094, throughput: 313.77 | 2022-04-11 04:46:04.589 [rank:1] [train], epoch: 26/50, iter: 400/834, loss: 0.31117, lr: 0.696704, top1: 0.63125, throughput: 313.77 | 2022-04-11 04:46:04.592 [rank:7] [train], epoch: 26/50, iter: 400/834, loss: 0.31373, lr: 0.696704, top1: 0.62625, throughput: 314.00 | 2022-04-11 04:46:04.608 [rank:6] [train], epoch: 26/50, iter: 400/834, loss: 0.31119, lr: 0.696704, top1: 0.63156, throughput: 313.56 | 2022-04-11 04:46:04.618 [rank:3] [train], epoch: 26/50, iter: 400/834, loss: 0.31541, lr: 0.696704, top1: 0.61766, throughput: 314.24 | 2022-04-11 04:46:04.551 [rank:0] [train], epoch: 26/50, iter: 400/834, loss: 0.31568, lr: 0.696704, top1: 0.61891, throughput: 313.96 | 2022-04-11 04:46:04.633 [rank:7] [train], epoch: 26/50, iter: 500/834, loss: 0.31422, lr: 0.690945, top1: 0.62068, throughput: 311.65 | 2022-04-11 04:47:06.215 [rank:2] [train], epoch: 26/50, iter: 500/834, loss: 0.31264, lr: 0.690945, top1: 0.62599, throughput: 311.32 | 2022-04-11 04:47:06.262 [rank:6] [train], epoch: 26/50, iter: 500/834, loss: 0.31216, lr: 0.690945, top1: 0.62484, throughput: 311.45 | 2022-04-11 04:47:06.264 [rank:1] [train], epoch: 26/50, iter: 500/834, loss: 0.31718, lr: 0.690945, top1: 0.61880, throughput: 311.27 | 2022-04-11 04:47:06.275 [rank:3] [train], epoch: 26/50, iter: 500/834, loss: 0.31161, lr: 0.690945, top1: 0.62823, throughput: 310.97 | 2022-04-11 04:47:06.294 [rank:4] [train], epoch: 26/50, iter: 500/834, loss: 0.31119, lr: 0.690945, top1: 0.63286, throughput: 311.06 | 2022-04-11 04:47:06.301 [rank:5] [train], epoch: 26/50, iter: 500/834, loss: 0.31417, lr: 0.690945, top1: 0.61937, throughput: 311.11 | 2022-04-11 04:47:06.303 [rank:0] [train], epoch: 26/50, iter: 500/834, loss: 0.30876, lr: 0.690945, top1: 0.62911, throughput: 311.26 | 2022-04-11 04:47:06.318 [rank:5] [train], epoch: 26/50, iter: 600/834, loss: 0.31189, lr: 0.685191, top1: 0.62828, throughput: 312.83 | 2022-04-11 04:48:07.680 [rank:4] [train], epoch: 26/50, iter: 600/834, loss: 0.31029, lr: 0.685191, top1: 0.62589, throughput: 312.66 | 2022-04-11 04:48:07.710 [rank:0] [train], epoch: 26/50, iter: 600/834, loss: 0.31493, lr: 0.685191, top1: 0.62161, throughput: 312.69 | 2022-04-11 04:48:07.720 [rank:6] [train], epoch: 26/50, iter: 600/834, loss: 0.31634, lr: 0.685191, top1: 0.62021, throughput: 312.41 | 2022-04-11 04:48:07.722 [rank:2] [train], epoch: 26/50, iter: 600/834, loss: 0.31435, lr: 0.685191, top1: 0.62432, throughput: 312.27 | 2022-04-11 04:48:07.747 [rank:3] [train], epoch: 26/50, iter: 600/834, loss: 0.31140, lr: 0.685191, top1: 0.62833, throughput: 312.41 | 2022-04-11 04:48:07.751 [rank:7] [train], epoch: 26/50, iter: 600/834, loss: 0.31260, lr: 0.685191, top1: 0.62964, throughput: 311.97 | 2022-04-11 04:48:07.759 [rank:1] [train], epoch: 26/50, iter: 600/834, loss: 0.31631, lr: 0.685191, top1: 0.62187, throughput: 312.19 | 2022-04-11 04:48:07.776 [rank:1] [train], epoch: 26/50, iter: 700/834, loss: 0.31438, lr: 0.679441, top1: 0.62344, throughput: 313.66 | 2022-04-11 04:49:08.989 [rank:4] [train], epoch: 26/50, iter: 700/834, loss: 0.31097, lr: 0.679441, top1: 0.62510, throughput: 313.22 | 2022-04-11 04:49:09.009 [rank:3] [train], epoch: 26/50, iter: 700/834, loss: 0.31188, lr: 0.679441, top1: 0.62651, throughput: 313.36 | 2022-04-11 04:49:09.023 [rank:5] [train], epoch: 26/50, iter: 700/834, loss: 0.31371, lr: 0.679441, top1: 0.62297, throughput: 312.97 | 2022-04-11 04:49:09.028 [rank:2] [train], epoch: 26/50, iter: 700/834, loss: 0.31475, lr: 0.679441, top1: 0.62328, throughput: 313.31 | 2022-04-11 04:49:09.029 [rank:0] [train], epoch: 26/50, iter: 700/834, loss: 0.31593, lr: 0.679441, top1: 0.62036, throughput: 313.15 | 2022-04-11 04:49:09.033 [rank:7] [train], epoch: 26/50, iter: 700/834, loss: 0.31302, lr: 0.679441, top1: 0.62505, throughput: 313.24 | 2022-04-11 04:49:09.054 [rank:6] [train], epoch: 26/50, iter: 700/834, loss: 0.31346, lr: 0.679441, top1: 0.62406, throughput: 312.99 | 2022-04-11 04:49:09.065 [rank:4] [train], epoch: 26/50, iter: 800/834, loss: 0.31297, lr: 0.673696, top1: 0.62578, throughput: 312.66 | 2022-04-11 04:50:10.418 [rank:2] [train], epoch: 26/50, iter: 800/834, loss: 0.31393, lr: 0.673696, top1: 0.62099, throughput: 312.57 | 2022-04-11 04:50:10.456 [rank:5] [train], epoch: 26/50, iter: 800/834, loss: 0.31390, lr: 0.673696, top1: 0.62292, throughput: 312.45 | 2022-04-11 04:50:10.478 [rank:0] [train], epoch: 26/50, iter: 800/834, loss: 0.31414, lr: 0.673696, top1: 0.62266, throughput: 312.30 | 2022-04-11 04:50:10.511 [rank:6] [train], epoch: 26/50, iter: 800/834, loss: 0.31443, lr: 0.673696, top1: 0.62422, throughput: 312.45 | 2022-04-11 04:50:10.515 [rank:1] [train], epoch: 26/50, iter: 800/834, loss: 0.31528, lr: 0.673696, top1: 0.61937, throughput: 312.05 | 2022-04-11 04:50:10.517 [rank:7] [train], epoch: 26/50, iter: 800/834, loss: 0.31477, lr: 0.673696, top1: 0.62323, throughput: 312.30 | 2022-04-11 04:50:10.533 [rank:3] [train], epoch: 26/50, iter: 800/834, loss: 0.31432, lr: 0.673696, top1: 0.62089, throughput: 312.12 | 2022-04-11 04:50:10.538 [rank:2] [train], epoch: 26/50, iter: 834/834, loss: 0.31080, lr: 0.671744, top1: 0.63557, throughput: 312.40 | 2022-04-11 04:50:31.352 [rank:4] [train], epoch: 26/50, iter: 834/834, loss: 0.31482, lr: 0.671744, top1: 0.62270, throughput: 311.80 | 2022-04-11 04:50:31.355 [rank:5] [train], epoch: 26/50, iter: 834/834, loss: 0.31507, lr: 0.671744, top1: 0.62040, throughput: 312.68 | 2022-04-11 04:50:31.355 [rank:7] [train], epoch: 26/50, iter: 834/834, loss: 0.31303, lr: 0.671744, top1: 0.62837, throughput: 313.48 | 2022-04-11 04:50:31.357 [rank:0] [train], epoch: 26/50, iter: 834/834, loss: 0.31374, lr: 0.671744, top1: 0.62132, throughput: 313.04 | 2022-04-11 04:50:31.365 [rank:1] [train], epoch: 26/50, iter: 834/834, loss: 0.31388, lr: 0.671744, top1: 0.62117, throughput: 312.69 | 2022-04-11 04:50:31.394 [rank:6] [train], epoch: 26/50, iter: 834/834, loss: 0.31574, lr: 0.671744, top1: 0.62270, throughput: 312.64 | 2022-04-11 04:50:31.395 [rank:3] [train], epoch: 26/50, iter: 834/834, loss: 0.31407, lr: 0.671744, top1: 0.61826, throughput: 312.92 | 2022-04-11 04:50:31.400 [rank:0] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.64288, throughput: 482.14 | 2022-04-11 04:50:44.328 [rank:1] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.63216, throughput: 483.14 | 2022-04-11 04:50:44.331 [rank:2] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.63056, throughput: 481.30 | 2022-04-11 04:50:44.338 [rank:3] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.62288, throughput: 482.77 | 2022-04-11 04:50:44.346 [rank:7] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.63952, throughput: 480.89 | 2022-04-11 04:50:44.353 [rank:6] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.62880, throughput: 481.63 | 2022-04-11 04:50:44.372 [rank:4] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.63280, throughput: 478.87 | 2022-04-11 04:50:44.406 [rank:5] [eval], epoch: 26/50, iter: 125/125, loss: 0.00000, lr: 0.671744, top1: 0.62672, throughput: 477.80 | 2022-04-11 04:50:44.436 [rank:0] [train], epoch: 27/50, iter: 100/834, loss: 0.31325, lr: 0.666007, top1: 0.62141, throughput: 313.05 | 2022-04-11 04:51:45.659 [rank:4] [train], epoch: 27/50, iter: 100/834, loss: 0.30927, lr: 0.666007, top1: 0.63182, throughput: 313.29 | 2022-04-11 04:51:45.692 [rank:1] [train], epoch: 27/50, iter: 100/834, loss: 0.30927, lr: 0.666007, top1: 0.63229, throughput: 312.89 | 2022-04-11 04:51:45.694 [rank:2] [train], epoch: 27/50, iter: 100/834, loss: 0.30784, lr: 0.666007, top1: 0.63260, throughput: 312.91 | 2022-04-11 04:51:45.697 [rank:7] [train], epoch: 27/50, iter: 100/834, loss: 0.30452, lr: 0.666007, top1: 0.64224, throughput: 312.96 | 2022-04-11 04:51:45.704 [rank:6] [train], epoch: 27/50, iter: 100/834, loss: 0.30526, lr: 0.666007, top1: 0.64146, throughput: 313.05 | 2022-04-11 04:51:45.704 [rank:3] [train], epoch: 27/50, iter: 100/834, loss: 0.30258, lr: 0.666007, top1: 0.64740, throughput: 312.91 | 2022-04-11 04:51:45.705 [rank:5] [train], epoch: 27/50, iter: 100/834, loss: 0.30946, lr: 0.666007, top1: 0.62922, throughput: 313.35 | 2022-04-11 04:51:45.709 [rank:1] [train], epoch: 27/50, iter: 200/834, loss: 0.30675, lr: 0.660275, top1: 0.63521, throughput: 314.39 | 2022-04-11 04:52:46.764 [rank:4] [train], epoch: 27/50, iter: 200/834, loss: 0.30762, lr: 0.660275, top1: 0.63422, throughput: 314.31 | 2022-04-11 04:52:46.779 [rank:6] [train], epoch: 27/50, iter: 200/834, loss: 0.30991, lr: 0.660275, top1: 0.62865, throughput: 314.33 | 2022-04-11 04:52:46.787 [rank:2] [train], epoch: 27/50, iter: 200/834, loss: 0.31130, lr: 0.660275, top1: 0.63464, throughput: 314.28 | 2022-04-11 04:52:46.789 [rank:3] [train], epoch: 27/50, iter: 200/834, loss: 0.31062, lr: 0.660275, top1: 0.62776, throughput: 314.30 | 2022-04-11 04:52:46.793 [rank:7] [train], epoch: 27/50, iter: 200/834, loss: 0.30680, lr: 0.660275, top1: 0.63828, throughput: 314.24 | 2022-04-11 04:52:46.803 [rank:0] [train], epoch: 27/50, iter: 200/834, loss: 0.30505, lr: 0.660275, top1: 0.64411, throughput: 314.33 | 2022-04-11 04:52:46.741 [rank:5] [train], epoch: 27/50, iter: 200/834, loss: 0.30808, lr: 0.660275, top1: 0.63677, throughput: 314.01 | 2022-04-11 04:52:46.854 [rank:4] [train], epoch: 27/50, iter: 300/834, loss: 0.30793, lr: 0.654549, top1: 0.62958, throughput: 313.42 | 2022-04-11 04:53:48.039 [rank:5] [train], epoch: 27/50, iter: 300/834, loss: 0.30856, lr: 0.654549, top1: 0.63313, throughput: 313.68 | 2022-04-11 04:53:48.063 [rank:1] [train], epoch: 27/50, iter: 300/834, loss: 0.30957, lr: 0.654549, top1: 0.63328, throughput: 313.20 | 2022-04-11 04:53:48.066 [rank:0] [train], epoch: 27/50, iter: 300/834, loss: 0.31173, lr: 0.654549, top1: 0.62542, throughput: 313.04 | 2022-04-11 04:53:48.075 [rank:7] [train], epoch: 27/50, iter: 300/834, loss: 0.30717, lr: 0.654549, top1: 0.63516, throughput: 313.32 | 2022-04-11 04:53:48.082 [rank:2] [train], epoch: 27/50, iter: 300/834, loss: 0.30712, lr: 0.654549, top1: 0.64068, throughput: 313.65 | 2022-04-11 04:53:48.004 [rank:3] [train], epoch: 27/50, iter: 300/834, loss: 0.31009, lr: 0.654549, top1: 0.63333, throughput: 313.20 | 2022-04-11 04:53:48.095 [rank:6] [train], epoch: 27/50, iter: 300/834, loss: 0.31118, lr: 0.654549, top1: 0.63068, throughput: 313.16 | 2022-04-11 04:53:48.098 [rank:5] [train], epoch: 27/50, iter: 400/834, loss: 0.30980, lr: 0.648830, top1: 0.63057, throughput: 312.45 | 2022-04-11 04:54:49.513 [rank:4] [train], epoch: 27/50, iter: 400/834, loss: 0.31049, lr: 0.648830, top1: 0.63047, throughput: 312.29 | 2022-04-11 04:54:49.521 [rank:6] [train], epoch: 27/50, iter: 400/834, loss: 0.30694, lr: 0.648830, top1: 0.63672, throughput: 312.45 | 2022-04-11 04:54:49.547 [rank:3] [train], epoch: 27/50, iter: 400/834, loss: 0.31002, lr: 0.648830, top1: 0.63151, throughput: 312.43 | 2022-04-11 04:54:49.549 [rank:0] [train], epoch: 27/50, iter: 400/834, loss: 0.31077, lr: 0.648830, top1: 0.62604, throughput: 312.30 | 2022-04-11 04:54:49.553 [rank:2] [train], epoch: 27/50, iter: 400/834, loss: 0.30833, lr: 0.648830, top1: 0.63245, throughput: 311.94 | 2022-04-11 04:54:49.554 [rank:1] [train], epoch: 27/50, iter: 400/834, loss: 0.30802, lr: 0.648830, top1: 0.63458, throughput: 312.53 | 2022-04-11 04:54:49.500 [rank:7] [train], epoch: 27/50, iter: 400/834, loss: 0.30909, lr: 0.648830, top1: 0.63203, throughput: 312.20 | 2022-04-11 04:54:49.580 [rank:2] [train], epoch: 27/50, iter: 500/834, loss: 0.30943, lr: 0.643117, top1: 0.63078, throughput: 313.51 | 2022-04-11 04:55:50.795 [rank:7] [train], epoch: 27/50, iter: 500/834, loss: 0.30860, lr: 0.643117, top1: 0.63005, throughput: 313.52 | 2022-04-11 04:55:50.821 [rank:3] [train], epoch: 27/50, iter: 500/834, loss: 0.31260, lr: 0.643117, top1: 0.62563, throughput: 313.24 | 2022-04-11 04:55:50.844 [rank:5] [train], epoch: 27/50, iter: 500/834, loss: 0.31096, lr: 0.643117, top1: 0.62776, throughput: 313.05 | 2022-04-11 04:55:50.845 [rank:6] [train], epoch: 27/50, iter: 500/834, loss: 0.30812, lr: 0.643117, top1: 0.63078, throughput: 313.51 | 2022-04-11 04:55:50.788 [rank:4] [train], epoch: 27/50, iter: 500/834, loss: 0.30922, lr: 0.643117, top1: 0.63172, throughput: 312.91 | 2022-04-11 04:55:50.881 [rank:1] [train], epoch: 27/50, iter: 500/834, loss: 0.31123, lr: 0.643117, top1: 0.62776, throughput: 313.27 | 2022-04-11 04:55:50.790 [rank:0] [train], epoch: 27/50, iter: 500/834, loss: 0.30937, lr: 0.643117, top1: 0.63161, throughput: 313.50 | 2022-04-11 04:55:50.797 [rank:0] [train], epoch: 27/50, iter: 600/834, loss: 0.31110, lr: 0.637412, top1: 0.63125, throughput: 312.20 | 2022-04-11 04:56:52.296 [rank:3] [train], epoch: 27/50, iter: 600/834, loss: 0.31057, lr: 0.637412, top1: 0.62724, throughput: 312.38 | 2022-04-11 04:56:52.308 [rank:1] [train], epoch: 27/50, iter: 600/834, loss: 0.31165, lr: 0.637412, top1: 0.62599, throughput: 312.03 | 2022-04-11 04:56:52.322 [rank:6] [train], epoch: 27/50, iter: 600/834, loss: 0.30997, lr: 0.637412, top1: 0.62922, throughput: 312.00 | 2022-04-11 04:56:52.326 [rank:7] [train], epoch: 27/50, iter: 600/834, loss: 0.31103, lr: 0.637412, top1: 0.63224, throughput: 312.08 | 2022-04-11 04:56:52.344 [rank:4] [train], epoch: 27/50, iter: 600/834, loss: 0.31259, lr: 0.637412, top1: 0.62901, throughput: 312.30 | 2022-04-11 04:56:52.361 [rank:5] [train], epoch: 27/50, iter: 600/834, loss: 0.31065, lr: 0.637412, top1: 0.62823, throughput: 312.42 | 2022-04-11 04:56:52.301 [rank:2] [train], epoch: 27/50, iter: 600/834, loss: 0.30844, lr: 0.637412, top1: 0.63422, throughput: 311.65 | 2022-04-11 04:56:52.402 [rank:0] [train], epoch: 27/50, iter: 700/834, loss: 0.30888, lr: 0.631714, top1: 0.63073, throughput: 312.82 | 2022-04-11 04:57:53.673 [rank:7] [train], epoch: 27/50, iter: 700/834, loss: 0.30876, lr: 0.631714, top1: 0.62974, throughput: 312.97 | 2022-04-11 04:57:53.691 [rank:6] [train], epoch: 27/50, iter: 700/834, loss: 0.31201, lr: 0.631714, top1: 0.62891, throughput: 312.84 | 2022-04-11 04:57:53.700 [rank:5] [train], epoch: 27/50, iter: 700/834, loss: 0.30791, lr: 0.631714, top1: 0.63484, throughput: 312.68 | 2022-04-11 04:57:53.707 [rank:4] [train], epoch: 27/50, iter: 700/834, loss: 0.31048, lr: 0.631714, top1: 0.62828, throughput: 312.95 | 2022-04-11 04:57:53.713 [rank:2] [train], epoch: 27/50, iter: 700/834, loss: 0.30814, lr: 0.631714, top1: 0.63750, throughput: 313.15 | 2022-04-11 04:57:53.714 [rank:1] [train], epoch: 27/50, iter: 700/834, loss: 0.31220, lr: 0.631714, top1: 0.62865, throughput: 312.71 | 2022-04-11 04:57:53.721 [rank:3] [train], epoch: 27/50, iter: 700/834, loss: 0.30933, lr: 0.631714, top1: 0.63333, throughput: 312.93 | 2022-04-11 04:57:53.664 [rank:4] [train], epoch: 27/50, iter: 800/834, loss: 0.31052, lr: 0.626024, top1: 0.62828, throughput: 311.87 | 2022-04-11 04:58:55.278 [rank:6] [train], epoch: 27/50, iter: 800/834, loss: 0.30996, lr: 0.626024, top1: 0.63057, throughput: 311.80 | 2022-04-11 04:58:55.278 [rank:5] [train], epoch: 27/50, iter: 800/834, loss: 0.31155, lr: 0.626024, top1: 0.62682, throughput: 311.82 | 2022-04-11 04:58:55.282 [rank:3] [train], epoch: 27/50, iter: 800/834, loss: 0.31233, lr: 0.626024, top1: 0.62464, throughput: 311.55 | 2022-04-11 04:58:55.291 [rank:2] [train], epoch: 27/50, iter: 800/834, loss: 0.31101, lr: 0.626024, top1: 0.63000, throughput: 311.59 | 2022-04-11 04:58:55.333 [rank:1] [train], epoch: 27/50, iter: 800/834, loss: 0.31180, lr: 0.626024, top1: 0.62573, throughput: 311.59 | 2022-04-11 04:58:55.341 [rank:0] [train], epoch: 27/50, iter: 800/834, loss: 0.30948, lr: 0.626024, top1: 0.63073, throughput: 311.32 | 2022-04-11 04:58:55.346 [rank:7] [train], epoch: 27/50, iter: 800/834, loss: 0.30918, lr: 0.626024, top1: 0.63229, throughput: 311.29 | 2022-04-11 04:58:55.370 [rank:0] [train], epoch: 27/50, iter: 834/834, loss: 0.30914, lr: 0.624091, top1: 0.62822, throughput: 311.96 | 2022-04-11 04:59:16.272 [rank:5] [train], epoch: 27/50, iter: 834/834, loss: 0.30623, lr: 0.624091, top1: 0.64323, throughput: 310.83 | 2022-04-11 04:59:16.283 [rank:2] [train], epoch: 27/50, iter: 834/834, loss: 0.30975, lr: 0.624091, top1: 0.62699, throughput: 311.43 | 2022-04-11 04:59:16.294 [rank:6] [train], epoch: 27/50, iter: 834/834, loss: 0.31059, lr: 0.624091, top1: 0.63097, throughput: 310.60 | 2022-04-11 04:59:16.296 [rank:7] [train], epoch: 27/50, iter: 834/834, loss: 0.31265, lr: 0.624091, top1: 0.62822, throughput: 311.85 | 2022-04-11 04:59:16.303 [rank:1] [train], epoch: 27/50, iter: 834/834, loss: 0.31276, lr: 0.624091, top1: 0.62255, throughput: 311.37 | 2022-04-11 04:59:16.306 [rank:3] [train], epoch: 27/50, iter: 834/834, loss: 0.30873, lr: 0.624091, top1: 0.63955, throughput: 310.61 | 2022-04-11 04:59:16.308 [rank:4] [train], epoch: 27/50, iter: 834/834, loss: 0.31071, lr: 0.624091, top1: 0.63082, throughput: 310.04 | 2022-04-11 04:59:16.333 [rank:0] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.65264, throughput: 483.98[rank:1] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.65104, throughput: 485.26 | 2022-04-11 04:59:29.186| 2022-04-11 04:59:29.185 [rank:2] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.63920, throughput: 484.63 | 2022-04-11 04:59:29.190 [rank:3] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.63984, throughput: 485.08 | 2022-04-11 04:59:29.192 [rank:5] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.63968, throughput: 483.56 | 2022-04-11 04:59:29.208 [rank:7] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.64640, throughput: 484.24 | 2022-04-11 04:59:29.210 [rank:6] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.64032, throughput: 483.55 | 2022-04-11 04:59:29.221 [rank:4] [eval], epoch: 27/50, iter: 125/125, loss: 0.00000, lr: 0.624091, top1: 0.64320, throughput: 484.52 | 2022-04-11 04:59:29.232 [rank:6] [train], epoch: 28/50, iter: 100/834, loss: 0.30427, lr: 0.618412, top1: 0.64031, throughput: 312.89 | 2022-04-11 05:00:30.584 [rank:5] [train], epoch: 28/50, iter: 100/834, loss: 0.30174, lr: 0.618412, top1: 0.64599, throughput: 312.78 | 2022-04-11 05:00:30.593 [rank:4] [train], epoch: 28/50, iter: 100/834, loss: 0.30133, lr: 0.618412, top1: 0.64911, throughput: 312.86 | 2022-04-11 05:00:30.602 [rank:7] [train], epoch: 28/50, iter: 100/834, loss: 0.30384, lr: 0.618412, top1: 0.63990, throughput: 312.69 | 2022-04-11 05:00:30.613 [rank:2] [train], epoch: 28/50, iter: 100/834, loss: 0.30463, lr: 0.618412, top1: 0.64073, throughput: 312.45 | 2022-04-11 05:00:30.640 [rank:3] [train], epoch: 28/50, iter: 100/834, loss: 0.30130, lr: 0.618412, top1: 0.64708, throughput: 312.42 | 2022-04-11 05:00:30.647 [rank:0] [train], epoch: 28/50, iter: 100/834, loss: 0.30321, lr: 0.618412, top1: 0.64469, throughput: 312.38 | 2022-04-11 05:00:30.649 [rank:1] [train], epoch: 28/50, iter: 100/834, loss: 0.30639, lr: 0.618412, top1: 0.64068, throughput: 312.27 | 2022-04-11 05:00:30.670 [rank:0] [train], epoch: 28/50, iter: 200/834, loss: 0.30638, lr: 0.612741, top1: 0.63729, throughput: 313.33 | 2022-04-11 05:01:31.926 [rank:4] [train], epoch: 28/50, iter: 200/834, loss: 0.30559, lr: 0.612741, top1: 0.63823, throughput: 312.92 | 2022-04-11 05:01:31.961 [rank:3] [train], epoch: 28/50, iter: 200/834, loss: 0.30485, lr: 0.612741, top1: 0.64068, throughput: 313.10 | 2022-04-11 05:01:31.970 [rank:5] [train], epoch: 28/50, iter: 200/834, loss: 0.30387, lr: 0.612741, top1: 0.64427, throughput: 312.81 | 2022-04-11 05:01:31.972 [rank:2] [train], epoch: 28/50, iter: 200/834, loss: 0.30457, lr: 0.612741, top1: 0.64510, throughput: 312.99 | 2022-04-11 05:01:31.984 [rank:7] [train], epoch: 28/50, iter: 200/834, loss: 0.30691, lr: 0.612741, top1: 0.63156, throughput: 312.84 | 2022-04-11 05:01:31.987 [rank:1] [train], epoch: 28/50, iter: 200/834, loss: 0.30619, lr: 0.612741, top1: 0.63589, throughput: 313.48 | 2022-04-11 05:01:31.918 [rank:6] [train], epoch: 28/50, iter: 200/834, loss: 0.30659, lr: 0.612741, top1: 0.63714, throughput: 312.58 | 2022-04-11 05:01:32.008 [rank:7] [train], epoch: 28/50, iter: 300/834, loss: 0.30609, lr: 0.607079, top1: 0.63542, throughput: 312.31 | 2022-04-11 05:02:33.464 [rank:5] [train], epoch: 28/50, iter: 300/834, loss: 0.30371, lr: 0.607079, top1: 0.64401, throughput: 312.16 | 2022-04-11 05:02:33.478 [rank:6] [train], epoch: 28/50, iter: 300/834, loss: 0.30272, lr: 0.607079, top1: 0.64260, throughput: 312.29 | 2022-04-11 05:02:33.489 [rank:1] [train], epoch: 28/50, iter: 300/834, loss: 0.30651, lr: 0.607079, top1: 0.63641, throughput: 311.80 | 2022-04-11 05:02:33.496 [rank:2] [train], epoch: 28/50, iter: 300/834, loss: 0.30381, lr: 0.607079, top1: 0.64141, throughput: 312.05 | 2022-04-11 05:02:33.513 [rank:3] [train], epoch: 28/50, iter: 300/834, loss: 0.30740, lr: 0.607079, top1: 0.63411, throughput: 311.93 | 2022-04-11 05:02:33.523 [rank:4] [train], epoch: 28/50, iter: 300/834, loss: 0.30736, lr: 0.607079, top1: 0.63344, throughput: 311.83 | 2022-04-11 05:02:33.533 [rank:0] [train], epoch: 28/50, iter: 300/834, loss: 0.30650, lr: 0.607079, top1: 0.63604, throughput: 312.10 | 2022-04-11 05:02:33.446 [rank:4] [train], epoch: 28/50, iter: 400/834, loss: 0.30804, lr: 0.601426, top1: 0.63255, throughput: 313.74 | 2022-04-11 05:03:34.731 [rank:6] [train], epoch: 28/50, iter: 400/834, loss: 0.30357, lr: 0.601426, top1: 0.64276, throughput: 313.47 | 2022-04-11 05:03:34.738 [rank:5] [train], epoch: 28/50, iter: 400/834, loss: 0.30793, lr: 0.601426, top1: 0.62885, throughput: 313.22 | 2022-04-11 05:03:34.778 [rank:2] [train], epoch: 28/50, iter: 400/834, loss: 0.30385, lr: 0.601426, top1: 0.64365, throughput: 313.39 | 2022-04-11 05:03:34.780 [rank:0] [train], epoch: 28/50, iter: 400/834, loss: 0.30538, lr: 0.601426, top1: 0.63693, throughput: 313.03 | 2022-04-11 05:03:34.781 [rank:1] [train], epoch: 28/50, iter: 400/834, loss: 0.30544, lr: 0.601426, top1: 0.63974, throughput: 313.20 | 2022-04-11 05:03:34.799 [rank:3] [train], epoch: 28/50, iter: 400/834, loss: 0.30418, lr: 0.601426, top1: 0.64734, throughput: 313.31 | 2022-04-11 05:03:34.803 [rank:7] [train], epoch: 28/50, iter: 400/834, loss: 0.30914, lr: 0.601426, top1: 0.63417, throughput: 312.89 | 2022-04-11 05:03:34.828 [rank:4] [train], epoch: 28/50, iter: 500/834, loss: 0.30619, lr: 0.595783, top1: 0.63417, throughput: 313.71 | 2022-04-11 05:04:35.933 [rank:1] [train], epoch: 28/50, iter: 500/834, loss: 0.30819, lr: 0.595783, top1: 0.63182, throughput: 313.81 | 2022-04-11 05:04:35.982 [rank:2] [train], epoch: 28/50, iter: 500/834, loss: 0.30592, lr: 0.595783, top1: 0.63927, throughput: 313.70 | 2022-04-11 05:04:35.985 [rank:0] [train], epoch: 28/50, iter: 500/834, loss: 0.30373, lr: 0.595783, top1: 0.63620, throughput: 313.62 | 2022-04-11 05:04:36.001 [rank:5] [train], epoch: 28/50, iter: 500/834, loss: 0.30776, lr: 0.595783, top1: 0.63526, throughput: 313.60 | 2022-04-11 05:04:36.003 [rank:7] [train], epoch: 28/50, iter: 500/834, loss: 0.30582, lr: 0.595783, top1: 0.63854, throughput: 313.84 | 2022-04-11 05:04:36.005 [rank:3] [train], epoch: 28/50, iter: 500/834, loss: 0.30784, lr: 0.595783, top1: 0.63479, throughput: 313.65 | 2022-04-11 05:04:36.018 [rank:6] [train], epoch: 28/50, iter: 500/834, loss: 0.30802, lr: 0.595783, top1: 0.63490, throughput: 313.24 | 2022-04-11 05:04:36.033 [rank:4] [train], epoch: 28/50, iter: 600/834, loss: 0.30491, lr: 0.590149, top1: 0.64026, throughput: 313.36 | 2022-04-11 05:05:37.204 [rank:6] [train], epoch: 28/50, iter: 600/834, loss: 0.30916, lr: 0.590149, top1: 0.63250, throughput: 313.76 | 2022-04-11 05:05:37.225 [rank:5] [train], epoch: 28/50, iter: 600/834, loss: 0.30807, lr: 0.590149, top1: 0.63672, throughput: 313.46 | 2022-04-11 05:05:37.254 [rank:7] [train], epoch: 28/50, iter: 600/834, loss: 0.30914, lr: 0.590149, top1: 0.63208, throughput: 313.27 | 2022-04-11 05:05:37.295 [rank:1] [train], epoch: 28/50, iter: 600/834, loss: 0.30658, lr: 0.590149, top1: 0.63583, throughput: 313.15 | 2022-04-11 05:05:37.295 [rank:2] [train], epoch: 28/50, iter: 600/834, loss: 0.30676, lr: 0.590149, top1: 0.63651, throughput: 313.16 | 2022-04-11 05:05:37.296 [rank:3] [train], epoch: 28/50, iter: 600/834, loss: 0.30671, lr: 0.590149, top1: 0.63755, throughput: 313.24 | 2022-04-11 05:05:37.314 [rank:0] [train], epoch: 28/50, iter: 600/834, loss: 0.31043, lr: 0.590149, top1: 0.63104, throughput: 313.08 | 2022-04-11 05:05:37.328 [rank:1] [train], epoch: 28/50, iter: 700/834, loss: 0.30695, lr: 0.584525, top1: 0.63703, throughput: 313.27 | 2022-04-11 05:06:38.583 [rank:4] [train], epoch: 28/50, iter: 700/834, loss: 0.30847, lr: 0.584525, top1: 0.63750, throughput: 312.77 | 2022-04-11 05:06:38.592 [rank:2] [train], epoch: 28/50, iter: 700/834, loss: 0.30472, lr: 0.584525, top1: 0.64349, throughput: 313.11 | 2022-04-11 05:06:38.616 [rank:0] [train], epoch: 28/50, iter: 700/834, loss: 0.30779, lr: 0.584525, top1: 0.63547, throughput: 313.24 | 2022-04-11 05:06:38.623 [rank:7] [train], epoch: 28/50, iter: 700/834, loss: 0.30720, lr: 0.584525, top1: 0.63594, throughput: 312.99 | 2022-04-11 05:06:38.638 [rank:6] [train], epoch: 28/50, iter: 700/834, loss: 0.30762, lr: 0.584525, top1: 0.63656, throughput: 312.64 | 2022-04-11 05:06:38.638 [rank:3] [train], epoch: 28/50, iter: 700/834, loss: 0.30625, lr: 0.584525, top1: 0.63734, throughput: 313.02 | 2022-04-11 05:06:38.652 [rank:5] [train], epoch: 28/50, iter: 700/834, loss: 0.30566, lr: 0.584525, top1: 0.63922, throughput: 312.99 | 2022-04-11 05:06:38.599 [rank:5] [train], epoch: 28/50, iter: 800/834, loss: 0.30624, lr: 0.578912, top1: 0.63932, throughput: 313.67 | 2022-04-11 05:07:39.810 [rank:2] [train], epoch: 28/50, iter: 800/834, loss: 0.30666, lr: 0.578912, top1: 0.64057, throughput: 313.29 | 2022-04-11 05:07:39.900 [rank:7] [train], epoch: 28/50, iter: 800/834, loss: 0.30967, lr: 0.578912, top1: 0.63495, throughput: 313.39 | 2022-04-11 05:07:39.903 [rank:1] [train], epoch: 28/50, iter: 800/834, loss: 0.30844, lr: 0.578912, top1: 0.63302, throughput: 312.99 | 2022-04-11 05:07:39.927 [rank:0] [train], epoch: 28/50, iter: 800/834, loss: 0.30619, lr: 0.578912, top1: 0.63698, throughput: 313.14 | 2022-04-11 05:07:39.937 [rank:3] [train], epoch: 28/50, iter: 800/834, loss: 0.30568, lr: 0.578912, top1: 0.63974, throughput: 313.27 | 2022-04-11 05:07:39.940 [rank:6] [train], epoch: 28/50, iter: 800/834, loss: 0.30817, lr: 0.578912, top1: 0.63438, throughput: 313.20 | 2022-04-11 05:07:39.941 [rank:4] [train], epoch: 28/50, iter: 800/834, loss: 0.30755, lr: 0.578912, top1: 0.63276, throughput: 313.37 | 2022-04-11 05:07:39.862 [rank:2] [train], epoch: 28/50, iter: 834/834, loss: 0.30678, lr: 0.577006, top1: 0.64216, throughput: 312.92 | 2022-04-11 05:08:00.762 [rank:5] [train], epoch: 28/50, iter: 834/834, loss: 0.30008, lr: 0.577006, top1: 0.65303, throughput: 311.51 | 2022-04-11 05:08:00.766 [rank:0] [train], epoch: 28/50, iter: 834/834, loss: 0.30783, lr: 0.577006, top1: 0.63388, throughput: 313.26 | 2022-04-11 05:08:00.776 [rank:6] [train], epoch: 28/50, iter: 834/834, loss: 0.30770, lr: 0.577006, top1: 0.63358, throughput: 313.28 | 2022-04-11 05:08:00.779 [rank:4] [train], epoch: 28/50, iter: 834/834, loss: 0.30374, lr: 0.577006, top1: 0.64292, throughput: 312.00 | 2022-04-11 05:08:00.785 [rank:1] [train], epoch: 28/50, iter: 834/834, loss: 0.30488, lr: 0.577006, top1: 0.64062, throughput: 312.95 | 2022-04-11 05:08:00.787 [rank:7] [train], epoch: 28/50, iter: 834/834, loss: 0.30903, lr: 0.577006, top1: 0.62730, throughput: 312.19 | 2022-04-11 05:08:00.814 [rank:3] [train], epoch: 28/50, iter: 834/834, loss: 0.30849, lr: 0.577006, top1: 0.63618, throughput: 312.69 | 2022-04-11 05:08:00.818 [rank:0] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.64960, throughput: 488.80 | 2022-04-11 05:08:13.562 [rank:1] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.65216, throughput: 488.95 | 2022-04-11 05:08:13.570 [rank:3] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.63920, throughput: 489.65 | 2022-04-11 05:08:13.582 [rank:2] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.64224, throughput: 487.49 | 2022-04-11 05:08:13.582 [rank:7] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.64704, throughput: 489.16 | 2022-04-11 05:08:13.591 [rank:5] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.64048, throughput: 487.32 | 2022-04-11 05:08:13.592 [rank:6] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.63968, throughput: 486.82 | 2022-04-11 05:08:13.617 [rank:4] [eval], epoch: 28/50, iter: 125/125, loss: 0.00000, lr: 0.577006, top1: 0.63904, throughput: 486.40 | 2022-04-11 05:08:13.635 [rank:0] [train], epoch: 29/50, iter: 100/834, loss: 0.30337, lr: 0.571407, top1: 0.64172, throughput: 313.22 | 2022-04-11 05:09:14.860 [rank:4] [train], epoch: 29/50, iter: 100/834, loss: 0.30272, lr: 0.571407, top1: 0.64422, throughput: 313.48 | 2022-04-11 05:09:14.883 [rank:6] [train], epoch: 29/50, iter: 100/834, loss: 0.30210, lr: 0.571407, top1: 0.64771, throughput: 313.18 | 2022-04-11 05:09:14.924 [rank:5] [train], epoch: 29/50, iter: 100/834, loss: 0.29987, lr: 0.571407, top1: 0.65229, throughput: 313.02 | 2022-04-11 05:09:14.930 [rank:1] [train], epoch: 29/50, iter: 100/834, loss: 0.30278, lr: 0.571407, top1: 0.64526, throughput: 312.90 | 2022-04-11 05:09:14.932 [rank:3] [train], epoch: 29/50, iter: 100/834, loss: 0.30025, lr: 0.571407, top1: 0.64932, throughput: 312.87 | 2022-04-11 05:09:14.948 [rank:7] [train], epoch: 29/50, iter: 100/834, loss: 0.29908, lr: 0.571407, top1: 0.65391, throughput: 312.91 | 2022-04-11 05:09:14.951 [rank:2] [train], epoch: 29/50, iter: 100/834, loss: 0.29883, lr: 0.571407, top1: 0.65250, throughput: 313.27 | 2022-04-11 05:09:14.871 [rank:2] [train], epoch: 29/50, iter: 200/834, loss: 0.29902, lr: 0.565820, top1: 0.65203, throughput: 312.03 | 2022-04-11 05:10:16.405 [rank:7] [train], epoch: 29/50, iter: 200/834, loss: 0.29959, lr: 0.565820, top1: 0.65167, throughput: 312.24 | 2022-04-11 05:10:16.441 [rank:4] [train], epoch: 29/50, iter: 200/834, loss: 0.30076, lr: 0.565820, top1: 0.64333, throughput: 311.90 | 2022-04-11 05:10:16.442 [rank:6] [train], epoch: 29/50, iter: 200/834, loss: 0.30128, lr: 0.565820, top1: 0.64656, throughput: 312.04 | 2022-04-11 05:10:16.455 [rank:3] [train], epoch: 29/50, iter: 200/834, loss: 0.30224, lr: 0.565820, top1: 0.64333, throughput: 312.13 | 2022-04-11 05:10:16.461 [rank:0] [train], epoch: 29/50, iter: 200/834, loss: 0.30128, lr: 0.565820, top1: 0.64599, throughput: 311.56 | 2022-04-11 05:10:16.486 [rank:5] [train], epoch: 29/50, iter: 200/834, loss: 0.30482, lr: 0.565820, top1: 0.64057, throughput: 311.90 | 2022-04-11 05:10:16.488 [rank:1] [train], epoch: 29/50, iter: 200/834, loss: 0.30489, lr: 0.565820, top1: 0.63792, throughput: 312.31 | 2022-04-11 05:10:16.409 [rank:6] [train], epoch: 29/50, iter: 300/834, loss: 0.30491, lr: 0.560244, top1: 0.64000, throughput: 313.72 | 2022-04-11 05:11:17.655 [rank:2] [train], epoch: 29/50, iter: 300/834, loss: 0.30283, lr: 0.560244, top1: 0.64870, throughput: 313.44 | 2022-04-11 05:11:17.660 [rank:3] [train], epoch: 29/50, iter: 300/834, loss: 0.30360, lr: 0.560244, top1: 0.64281, throughput: 313.69 | 2022-04-11 05:11:17.667 [rank:0] [train], epoch: 29/50, iter: 300/834, loss: 0.30044, lr: 0.560244, top1: 0.64693, throughput: 313.78 | 2022-04-11 05:11:17.676 [rank:1] [train], epoch: 29/50, iter: 300/834, loss: 0.30426, lr: 0.560244, top1: 0.64177, throughput: 313.22 | 2022-04-11 05:11:17.708 [rank:4] [train], epoch: 29/50, iter: 300/834, loss: 0.30206, lr: 0.560244, top1: 0.64443, throughput: 313.34 | 2022-04-11 05:11:17.718 [rank:7] [train], epoch: 29/50, iter: 300/834, loss: 0.30437, lr: 0.560244, top1: 0.64573, throughput: 313.29 | 2022-04-11 05:11:17.727 [rank:5] [train], epoch: 29/50, iter: 300/834, loss: 0.30364, lr: 0.560244, top1: 0.64021, throughput: 313.87 | 2022-04-11 05:11:17.661 [rank:5] [train], epoch: 29/50, iter: 400/834, loss: 0.30439, lr: 0.554680, top1: 0.64526, throughput: 312.89 | 2022-04-11 05:12:19.024 [rank:6] [train], epoch: 29/50, iter: 400/834, loss: 0.30192, lr: 0.554680, top1: 0.64839, throughput: 312.80 | 2022-04-11 05:12:19.037 [rank:3] [train], epoch: 29/50, iter: 400/834, loss: 0.30270, lr: 0.554680, top1: 0.64630, throughput: 312.78 | 2022-04-11 05:12:19.053 [rank:4] [train], epoch: 29/50, iter: 400/834, loss: 0.30276, lr: 0.554680, top1: 0.64620, throughput: 312.95 | 2022-04-11 05:12:19.070 [rank:0] [train], epoch: 29/50, iter: 400/834, loss: 0.30439, lr: 0.554680, top1: 0.64198, throughput: 312.63 | 2022-04-11 05:12:19.089 [rank:2] [train], epoch: 29/50, iter: 400/834, loss: 0.30708, lr: 0.554680, top1: 0.63505, throughput: 312.55 | 2022-04-11 05:12:19.089 [rank:7] [train], epoch: 29/50, iter: 400/834, loss: 0.30550, lr: 0.554680, top1: 0.63599, throughput: 312.88 | 2022-04-11 05:12:19.092 [rank:1] [train], epoch: 29/50, iter: 400/834, loss: 0.30345, lr: 0.554680, top1: 0.64219, throughput: 312.58 | 2022-04-11 05:12:19.133 [rank:2] [train], epoch: 29/50, iter: 500/834, loss: 0.30106, lr: 0.549127, top1: 0.64766, throughput: 314.62 | 2022-04-11 05:13:20.115 [rank:5] [train], epoch: 29/50, iter: 500/834, loss: 0.30262, lr: 0.549127, top1: 0.64620, throughput: 314.23 | 2022-04-11 05:13:20.127 [rank:1] [train], epoch: 29/50, iter: 500/834, loss: 0.30305, lr: 0.549127, top1: 0.64089, throughput: 314.78 | 2022-04-11 05:13:20.128 [rank:7] [train], epoch: 29/50, iter: 500/834, loss: 0.30151, lr: 0.549127, top1: 0.64422, throughput: 314.42 | 2022-04-11 05:13:20.157 [rank:6] [train], epoch: 29/50, iter: 500/834, loss: 0.30245, lr: 0.549127, top1: 0.64224, throughput: 314.03 | 2022-04-11 05:13:20.177 [rank:0] [train], epoch: 29/50, iter: 500/834, loss: 0.30191, lr: 0.549127, top1: 0.64870, throughput: 314.27 | 2022-04-11 05:13:20.184 [rank:3] [train], epoch: 29/50, iter: 500/834, loss: 0.30373, lr: 0.549127, top1: 0.64214, throughput: 314.07 | 2022-04-11 05:13:20.186 [rank:4] [train], epoch: 29/50, iter: 500/834, loss: 0.30169, lr: 0.549127, top1: 0.64328, throughput: 314.12 | 2022-04-11 05:13:20.193 [rank:7] [train], epoch: 29/50, iter: 600/834, loss: 0.30321, lr: 0.543588, top1: 0.64438, throughput: 313.01 | 2022-04-11 05:14:21.496 [rank:4] [train], epoch: 29/50, iter: 600/834, loss: 0.30402, lr: 0.543588, top1: 0.63708, throughput: 313.10 | 2022-04-11 05:14:21.514 [rank:2] [train], epoch: 29/50, iter: 600/834, loss: 0.30403, lr: 0.543588, top1: 0.64255, throughput: 312.68 | 2022-04-11 05:14:21.519 [rank:1] [train], epoch: 29/50, iter: 600/834, loss: 0.30431, lr: 0.543588, top1: 0.64094, throughput: 312.74 | 2022-04-11 05:14:21.521 [rank:5] [train], epoch: 29/50, iter: 600/834, loss: 0.30363, lr: 0.543588, top1: 0.64807, throughput: 312.69 | 2022-04-11 05:14:21.529 [rank:6] [train], epoch: 29/50, iter: 600/834, loss: 0.30292, lr: 0.543588, top1: 0.64490, throughput: 312.80 | 2022-04-11 05:14:21.558 [rank:3] [train], epoch: 29/50, iter: 600/834, loss: 0.30252, lr: 0.543588, top1: 0.64625, throughput: 312.76 | 2022-04-11 05:14:21.575 [rank:0] [train], epoch: 29/50, iter: 600/834, loss: 0.30323, lr: 0.543588, top1: 0.64099, throughput: 312.72 | 2022-04-11 05:14:21.580 [rank:5] [train], epoch: 29/50, iter: 700/834, loss: 0.30229, lr: 0.538061, top1: 0.64536, throughput: 315.09 | 2022-04-11 05:15:22.464 [rank:6] [train], epoch: 29/50, iter: 700/834, loss: 0.30057, lr: 0.538061, top1: 0.64880, throughput: 314.87 | 2022-04-11 05:15:22.535 [rank:4] [train], epoch: 29/50, iter: 700/834, loss: 0.30307, lr: 0.538061, top1: 0.64193, throughput: 314.58 | 2022-04-11 05:15:22.548 [rank:2] [train], epoch: 29/50, iter: 700/834, loss: 0.30379, lr: 0.538061, top1: 0.64484, throughput: 314.50 | 2022-04-11 05:15:22.568 [rank:1] [train], epoch: 29/50, iter: 700/834, loss: 0.30199, lr: 0.538061, top1: 0.64385, throughput: 314.46 | 2022-04-11 05:15:22.579 [rank:3] [train], epoch: 29/50, iter: 700/834, loss: 0.30433, lr: 0.538061, top1: 0.64187, throughput: 314.73 | 2022-04-11 05:15:22.579 [rank:7] [train], epoch: 29/50, iter: 700/834, loss: 0.30349, lr: 0.538061, top1: 0.64068, throughput: 314.29 | 2022-04-11 05:15:22.586 [rank:0] [train], epoch: 29/50, iter: 700/834, loss: 0.30459, lr: 0.538061, top1: 0.63875, throughput: 314.53 | 2022-04-11 05:15:22.624 [rank:4] [train], epoch: 29/50, iter: 800/834, loss: 0.30243, lr: 0.532547, top1: 0.64479, throughput: 313.59 | 2022-04-11 05:16:23.774 [rank:5] [train], epoch: 29/50, iter: 800/834, loss: 0.30317, lr: 0.532547, top1: 0.64266, throughput: 312.61 | 2022-04-11 05:16:23.882 [rank:0] [train], epoch: 29/50, iter: 800/834, loss: 0.30356, lr: 0.532547, top1: 0.64125, throughput: 313.41 | 2022-04-11 05:16:23.885 [rank:6] [train], epoch: 29/50, iter: 800/834, loss: 0.30340, lr: 0.532547, top1: 0.64198, throughput: 312.90 | 2022-04-11 05:16:23.896 [rank:2] [train], epoch: 29/50, iter: 800/834, loss: 0.30029, lr: 0.532547, top1: 0.65010, throughput: 313.07 | 2022-04-11 05:16:23.895 [rank:1] [train], epoch: 29/50, iter: 800/834, loss: 0.30260, lr: 0.532547, top1: 0.64229, throughput: 313.11 | 2022-04-11 05:16:23.898 [rank:3] [train], epoch: 29/50, iter: 800/834, loss: 0.30472, lr: 0.532547, top1: 0.64156, throughput: 312.93 | 2022-04-11 05:16:23.935 [rank:7] [train], epoch: 29/50, iter: 800/834, loss: 0.30689, lr: 0.532547, top1: 0.63396, throughput: 312.83 | 2022-04-11 05:16:23.962 [rank:6] [train], epoch: 29/50, iter: 834/834, loss: 0.30901, lr: 0.530675, top1: 0.63235, throughput: 315.04 | 2022-04-11 05:16:44.617 [rank:5] [train], epoch: 29/50, iter: 834/834, loss: 0.30139, lr: 0.530675, top1: 0.64262, throughput: 314.81 | 2022-04-11 05:16:44.618 [rank:1] [train], epoch: 29/50, iter: 834/834, loss: 0.30284, lr: 0.530675, top1: 0.64139, throughput: 314.67 | 2022-04-11 05:16:44.644 [rank:2] [train], epoch: 29/50, iter: 834/834, loss: 0.30437, lr: 0.530675, top1: 0.64522, throughput: 314.39 | 2022-04-11 05:16:44.659 [rank:0] [train], epoch: 29/50, iter: 834/834, loss: 0.30310, lr: 0.530675, top1: 0.64093, throughput: 314.22 | 2022-04-11 05:16:44.661 [rank:7] [train], epoch: 29/50, iter: 834/834, loss: 0.30850, lr: 0.530675, top1: 0.63404, throughput: 315.34 | 2022-04-11 05:16:44.664 [rank:3] [train], epoch: 29/50, iter: 834/834, loss: 0.30435, lr: 0.530675, top1: 0.64369, throughput: 314.82 | 2022-04-11 05:16:44.670 [rank:4] [train], epoch: 29/50, iter: 834/834, loss: 0.30274, lr: 0.530675, top1: 0.63925, throughput: 311.93 | 2022-04-11 05:16:44.702 [rank:0] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.64880, throughput: 483.76 | 2022-04-11 05:16:57.580 [rank:1] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.65264, throughput: 483.04 | 2022-04-11 05:16:57.583 [rank:2] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.64416, throughput: 483.49 | 2022-04-11 05:16:57.586 [rank:3] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.64400, throughput: 483.47 | 2022-04-11 05:16:57.598 [rank:7] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.65456, throughput: 483.02 | 2022-04-11 05:16:57.604 [rank:5] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.63328, throughput: 481.29 | 2022-04-11 05:16:57.604 [rank:6] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.64576, throughput: 480.55 | 2022-04-11 05:16:57.623 [rank:4] [eval], epoch: 29/50, iter: 125/125, loss: 0.00000, lr: 0.530675, top1: 0.64976, throughput: 483.65 | 2022-04-11 05:16:57.625 [rank:5] [train], epoch: 30/50, iter: 100/834, loss: 0.29923, lr: 0.525179, top1: 0.65000, throughput: 312.76 | 2022-04-11 05:17:58.993 [rank:2] [train], epoch: 30/50, iter: 100/834, loss: 0.29822, lr: 0.525179, top1: 0.65589, throughput: 312.58 | 2022-04-11 05:17:59.009 [rank:4] [train], epoch: 30/50, iter: 100/834, loss: 0.29988, lr: 0.525179, top1: 0.65156, throughput: 312.74 | 2022-04-11 05:17:59.018 [rank:0] [train], epoch: 30/50, iter: 100/834, loss: 0.29742, lr: 0.525179, top1: 0.65297, throughput: 312.45 | 2022-04-11 05:17:59.030 [rank:3] [train], epoch: 30/50, iter: 100/834, loss: 0.30034, lr: 0.525179, top1: 0.64687, throughput: 312.35 | 2022-04-11 05:17:59.068 [rank:6] [train], epoch: 30/50, iter: 100/834, loss: 0.29839, lr: 0.525179, top1: 0.65234, throughput: 312.46 | 2022-04-11 05:17:59.071 [rank:7] [train], epoch: 30/50, iter: 100/834, loss: 0.29708, lr: 0.525179, top1: 0.65490, throughput: 312.70 | 2022-04-11 05:17:59.004 [rank:1] [train], epoch: 30/50, iter: 100/834, loss: 0.29642, lr: 0.525179, top1: 0.65552, throughput: 312.59 | 2022-04-11 05:17:59.005 [rank:6] [train], epoch: 30/50, iter: 200/834, loss: 0.29538, lr: 0.519697, top1: 0.66000, throughput: 313.91 | 2022-04-11 05:19:00.236 [rank:4] [train], epoch: 30/50, iter: 200/834, loss: 0.29753, lr: 0.519697, top1: 0.65010, throughput: 313.57 | 2022-04-11 05:19:00.249 [rank:1] [train], epoch: 30/50, iter: 200/834, loss: 0.29938, lr: 0.519697, top1: 0.64802, throughput: 313.49 | 2022-04-11 05:19:00.250 [rank:7] [train], epoch: 30/50, iter: 200/834, loss: 0.30065, lr: 0.519697, top1: 0.64755, throughput: 313.44 | 2022-04-11 05:19:00.260 [rank:2] [train], epoch: 30/50, iter: 200/834, loss: 0.29766, lr: 0.519697, top1: 0.65312, throughput: 313.83 | 2022-04-11 05:19:00.189 [rank:3] [train], epoch: 30/50, iter: 200/834, loss: 0.29583, lr: 0.519697, top1: 0.65891, throughput: 313.68 | 2022-04-11 05:19:00.276 [rank:5] [train], epoch: 30/50, iter: 200/834, loss: 0.30067, lr: 0.519697, top1: 0.64578, throughput: 313.27 | 2022-04-11 05:19:00.283 [rank:0] [train], epoch: 30/50, iter: 200/834, loss: 0.29533, lr: 0.519697, top1: 0.66193, throughput: 313.37 | 2022-04-11 05:19:00.300 [rank:0] [train], epoch: 30/50, iter: 300/834, loss: 0.30042, lr: 0.514229, top1: 0.65260, throughput: 313.74 | 2022-04-11 05:20:01.497 [rank:4] [train], epoch: 30/50, iter: 300/834, loss: 0.30146, lr: 0.514229, top1: 0.64740, throughput: 313.30 | 2022-04-11 05:20:01.533 [rank:5] [train], epoch: 30/50, iter: 300/834, loss: 0.29812, lr: 0.514229, top1: 0.65286, throughput: 313.46 | 2022-04-11 05:20:01.534 [rank:2] [train], epoch: 30/50, iter: 300/834, loss: 0.29871, lr: 0.514229, top1: 0.65208, throughput: 312.94 | 2022-04-11 05:20:01.544 [rank:1] [train], epoch: 30/50, iter: 300/834, loss: 0.30165, lr: 0.514229, top1: 0.64745, throughput: 313.24 | 2022-04-11 05:20:01.545 [rank:7] [train], epoch: 30/50, iter: 300/834, loss: 0.30040, lr: 0.514229, top1: 0.65141, throughput: 313.18 | 2022-04-11 05:20:01.567 [rank:6] [train], epoch: 30/50, iter: 300/834, loss: 0.30018, lr: 0.514229, top1: 0.64870, throughput: 313.49 | 2022-04-11 05:20:01.483 [rank:3] [train], epoch: 30/50, iter: 300/834, loss: 0.30040, lr: 0.514229, top1: 0.65292, throughput: 313.66 | 2022-04-11 05:20:01.488 [rank:7] [train], epoch: 30/50, iter: 400/834, loss: 0.29899, lr: 0.508775, top1: 0.65224, throughput: 311.49 | 2022-04-11 05:21:03.206 [rank:1] [train], epoch: 30/50, iter: 400/834, loss: 0.30200, lr: 0.508775, top1: 0.64443, throughput: 311.32 | 2022-04-11 05:21:03.218 [rank:6] [train], epoch: 30/50, iter: 400/834, loss: 0.29676, lr: 0.508775, top1: 0.65557, throughput: 310.96 | 2022-04-11 05:21:03.228 [rank:4] [train], epoch: 30/50, iter: 400/834, loss: 0.30051, lr: 0.508775, top1: 0.64656, throughput: 311.10 | 2022-04-11 05:21:03.249 [rank:0] [train], epoch: 30/50, iter: 400/834, loss: 0.29851, lr: 0.508775, top1: 0.64964, throughput: 310.87 | 2022-04-11 05:21:03.259 [rank:5] [train], epoch: 30/50, iter: 400/834, loss: 0.29747, lr: 0.508775, top1: 0.65151, throughput: 311.01 | 2022-04-11 05:21:03.269 [rank:3] [train], epoch: 30/50, iter: 400/834, loss: 0.29794, lr: 0.508775, top1: 0.65224, throughput: 310.77 | 2022-04-11 05:21:03.271 [rank:2] [train], epoch: 30/50, iter: 400/834, loss: 0.29963, lr: 0.508775, top1: 0.65161, throughput: 311.03 | 2022-04-11 05:21:03.274 [rank:2] [train], epoch: 30/50, iter: 500/834, loss: 0.30115, lr: 0.503336, top1: 0.64615, throughput: 314.18 | 2022-04-11 05:22:04.386 [rank:5] [train], epoch: 30/50, iter: 500/834, loss: 0.30062, lr: 0.503336, top1: 0.64953, throughput: 314.09 | 2022-04-11 05:22:04.398 [rank:3] [train], epoch: 30/50, iter: 500/834, loss: 0.30013, lr: 0.503336, top1: 0.65083, throughput: 314.03 | 2022-04-11 05:22:04.412 [rank:6] [train], epoch: 30/50, iter: 500/834, loss: 0.30023, lr: 0.503336, top1: 0.64703, throughput: 313.79 | 2022-04-11 05:22:04.415 [rank:4] [train], epoch: 30/50, iter: 500/834, loss: 0.29921, lr: 0.503336, top1: 0.65260, throughput: 313.72 | 2022-04-11 05:22:04.451 [rank:1] [train], epoch: 30/50, iter: 500/834, loss: 0.30094, lr: 0.503336, top1: 0.64693, throughput: 313.95 | 2022-04-11 05:22:04.375 [rank:7] [train], epoch: 30/50, iter: 500/834, loss: 0.29720, lr: 0.503336, top1: 0.65422, throughput: 313.39 | 2022-04-11 05:22:04.471 [rank:0] [train], epoch: 30/50, iter: 500/834, loss: 0.30189, lr: 0.503336, top1: 0.64474, throughput: 313.61 | 2022-04-11 05:22:04.482 [rank:2] [train], epoch: 30/50, iter: 600/834, loss: 0.30122, lr: 0.497912, top1: 0.64589, throughput: 312.39 | 2022-04-11 05:23:05.846 [rank:7] [train], epoch: 30/50, iter: 600/834, loss: 0.29788, lr: 0.497912, top1: 0.65323, throughput: 312.73 | 2022-04-11 05:23:05.865 [rank:4] [train], epoch: 30/50, iter: 600/834, loss: 0.30072, lr: 0.497912, top1: 0.64937, throughput: 312.62 | 2022-04-11 05:23:05.866 [rank:5] [train], epoch: 30/50, iter: 600/834, loss: 0.29943, lr: 0.497912, top1: 0.65068, throughput: 312.34 | 2022-04-11 05:23:05.869 [rank:3] [train], epoch: 30/50, iter: 600/834, loss: 0.30190, lr: 0.497912, top1: 0.64531, throughput: 312.31 | 2022-04-11 05:23:05.889 [rank:1] [train], epoch: 30/50, iter: 600/834, loss: 0.29992, lr: 0.497912, top1: 0.64922, throughput: 312.12 | 2022-04-11 05:23:05.890 [rank:6] [train], epoch: 30/50, iter: 600/834, loss: 0.29996, lr: 0.497912, top1: 0.64901, throughput: 312.20 | 2022-04-11 05:23:05.913 [rank:0] [train], epoch: 30/50, iter: 600/834, loss: 0.29763, lr: 0.497912, top1: 0.65120, throughput: 312.43 | 2022-04-11 05:23:05.937 [rank:0] [train], epoch: 30/50, iter: 700/834, loss: 0.29968, lr: 0.492503, top1: 0.65328, throughput: 314.93 | 2022-04-11 05:24:06.903 [rank:2] [train], epoch: 30/50, iter: 700/834, loss: 0.30052, lr: 0.492503, top1: 0.64781, throughput: 314.42 | 2022-04-11 05:24:06.911 [rank:1] [train], epoch: 30/50, iter: 700/834, loss: 0.29859, lr: 0.492503, top1: 0.65229, throughput: 314.63 | 2022-04-11 05:24:06.914 [rank:6] [train], epoch: 30/50, iter: 700/834, loss: 0.29941, lr: 0.492503, top1: 0.65099, throughput: 314.74 | 2022-04-11 05:24:06.916 [rank:4] [train], epoch: 30/50, iter: 700/834, loss: 0.30085, lr: 0.492503, top1: 0.64620, throughput: 314.47 | 2022-04-11 05:24:06.921 [rank:3] [train], epoch: 30/50, iter: 700/834, loss: 0.29900, lr: 0.492503, top1: 0.64677, throughput: 314.54 | 2022-04-11 05:24:06.930 [rank:5] [train], epoch: 30/50, iter: 700/834, loss: 0.30221, lr: 0.492503, top1: 0.64604, throughput: 314.23 | 2022-04-11 05:24:06.971 [rank:7] [train], epoch: 30/50, iter: 700/834, loss: 0.29888, lr: 0.492503, top1: 0.65089, throughput: 314.16 | 2022-04-11 05:24:06.980 [rank:5] [train], epoch: 30/50, iter: 800/834, loss: 0.30200, lr: 0.487110, top1: 0.64719, throughput: 313.18 | 2022-04-11 05:25:08.278 [rank:0] [train], epoch: 30/50, iter: 800/834, loss: 0.29981, lr: 0.487110, top1: 0.64979, throughput: 312.78 | 2022-04-11 05:25:08.288 [rank:3] [train], epoch: 30/50, iter: 800/834, loss: 0.29741, lr: 0.487110, top1: 0.65604, throughput: 312.91 | 2022-04-11 05:25:08.289 [rank:2] [train], epoch: 30/50, iter: 800/834, loss: 0.30011, lr: 0.487110, top1: 0.64453, throughput: 312.77 | 2022-04-11 05:25:08.298 [rank:4] [train], epoch: 30/50, iter: 800/834, loss: 0.29893, lr: 0.487110, top1: 0.65141, throughput: 312.78 | 2022-04-11 05:25:08.306 [rank:1] [train], epoch: 30/50, iter: 800/834, loss: 0.30185, lr: 0.487110, top1: 0.64589, throughput: 312.55 | 2022-04-11 05:25:08.344 [rank:7] [train], epoch: 30/50, iter: 800/834, loss: 0.29843, lr: 0.487110, top1: 0.65036, throughput: 312.88 | 2022-04-11 05:25:08.345 [rank:6] [train], epoch: 30/50, iter: 800/834, loss: 0.30069, lr: 0.487110, top1: 0.65021, throughput: 312.46 | 2022-04-11 05:25:08.364 [rank:4] [train], epoch: 30/50, iter: 834/834, loss: 0.29773, lr: 0.485280, top1: 0.65288, throughput: 313.33 | 2022-04-11 05:25:29.140 [rank:5] [train], epoch: 30/50, iter: 834/834, loss: 0.29953, lr: 0.485280, top1: 0.64568, throughput: 312.86 | 2022-04-11 05:25:29.143 [rank:2] [train], epoch: 30/50, iter: 834/834, loss: 0.29861, lr: 0.485280, top1: 0.66192, throughput: 313.14 | 2022-04-11 05:25:29.145 [rank:6] [train], epoch: 30/50, iter: 834/834, loss: 0.30003, lr: 0.485280, top1: 0.64369, throughput: 314.11 | 2022-04-11 05:25:29.147 [rank:0] [train], epoch: 30/50, iter: 834/834, loss: 0.30153, lr: 0.485280, top1: 0.65028, throughput: 312.93 | 2022-04-11 05:25:29.148 [rank:1] [train], epoch: 30/50, iter: 834/834, loss: 0.30263, lr: 0.485280, top1: 0.64798, throughput: 313.75 | 2022-04-11 05:25:29.150 [rank:7] [train], epoch: 30/50, iter: 834/834, loss: 0.30399, lr: 0.485280, top1: 0.64767, throughput: 313.73 | 2022-04-11 05:25:29.153 [rank:3] [train], epoch: 30/50, iter: 834/834, loss: 0.30091, lr: 0.485280, top1: 0.65288, throughput: 312.67 | 2022-04-11 05:25:29.168 [rank:0] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.67632, throughput: 485.71 | 2022-04-11 05:25:42.016 [rank:1] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.67040, throughput: 485.59 | 2022-04-11 05:25:42.021 [rank:2] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.66256, throughput: 485.13 | 2022-04-11 05:25:42.028 [rank:3] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.67232, throughput: 485.75 | 2022-04-11 05:25:42.035 [rank:7] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.66992, throughput: 484.58 | 2022-04-11 05:25:42.051 [rank:5] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.66288, throughput: 484.26 | 2022-04-11 05:25:42.050 [rank:4] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.67840, throughput: 483.64 | 2022-04-11 05:25:42.063 [rank:6] [eval], epoch: 30/50, iter: 125/125, loss: 0.00000, lr: 0.485280, top1: 0.67632, throughput: 483.79 | 2022-04-11 05:25:42.065 [rank:4] [train], epoch: 31/50, iter: 100/834, loss: 0.29354, lr: 0.479909, top1: 0.65750, throughput: 313.08 | 2022-04-11 05:26:43.389 [rank:0] [train], epoch: 31/50, iter: 100/834, loss: 0.29184, lr: 0.479909, top1: 0.66375, throughput: 312.80 | 2022-04-11 05:26:43.397 [rank:5] [train], epoch: 31/50, iter: 100/834, loss: 0.29052, lr: 0.479909, top1: 0.67146, throughput: 312.89 | 2022-04-11 05:26:43.413 [rank:6] [train], epoch: 31/50, iter: 100/834, loss: 0.29485, lr: 0.479909, top1: 0.65969, throughput: 313.35 | 2022-04-11 05:26:43.339 [rank:2] [train], epoch: 31/50, iter: 100/834, loss: 0.29357, lr: 0.479909, top1: 0.66161, throughput: 312.65 | 2022-04-11 05:26:43.439 [rank:3] [train], epoch: 31/50, iter: 100/834, loss: 0.29182, lr: 0.479909, top1: 0.66354, throughput: 312.61 | 2022-04-11 05:26:43.454 [rank:7] [train], epoch: 31/50, iter: 100/834, loss: 0.29327, lr: 0.479909, top1: 0.66260, throughput: 312.63 | 2022-04-11 05:26:43.465 [rank:1] [train], epoch: 31/50, iter: 100/834, loss: 0.29174, lr: 0.479909, top1: 0.66865, throughput: 312.46 | 2022-04-11 05:26:43.468 [rank:1] [train], epoch: 31/50, iter: 200/834, loss: 0.29465, lr: 0.474554, top1: 0.66182, throughput: 313.54 | 2022-04-11 05:27:44.704 [rank:2] [train], epoch: 31/50, iter: 200/834, loss: 0.29423, lr: 0.474554, top1: 0.66089, throughput: 313.36 | 2022-04-11 05:27:44.711 [rank:5] [train], epoch: 31/50, iter: 200/834, loss: 0.29591, lr: 0.474554, top1: 0.65734, throughput: 313.19 | 2022-04-11 05:27:44.717 [rank:3] [train], epoch: 31/50, iter: 200/834, loss: 0.29528, lr: 0.474554, top1: 0.66125, throughput: 313.37 | 2022-04-11 05:27:44.724 [rank:4] [train], epoch: 31/50, iter: 200/834, loss: 0.29424, lr: 0.474554, top1: 0.66474, throughput: 313.01 | 2022-04-11 05:27:44.730 [rank:0] [train], epoch: 31/50, iter: 200/834, loss: 0.29682, lr: 0.474554, top1: 0.65677, throughput: 313.01 | 2022-04-11 05:27:44.737 [rank:7] [train], epoch: 31/50, iter: 200/834, loss: 0.29718, lr: 0.474554, top1: 0.65474, throughput: 313.34 | 2022-04-11 05:27:44.740 [rank:6] [train], epoch: 31/50, iter: 200/834, loss: 0.29510, lr: 0.474554, top1: 0.65635, throughput: 312.54 | 2022-04-11 05:27:44.771 [rank:7] [train], epoch: 31/50, iter: 300/834, loss: 0.29627, lr: 0.469215, top1: 0.65484, throughput: 312.85 | 2022-04-11 05:28:46.112 [rank:0] [train], epoch: 31/50, iter: 300/834, loss: 0.29700, lr: 0.469215, top1: 0.65677, throughput: 312.80 | 2022-04-11 05:28:46.119 [rank:4] [train], epoch: 31/50, iter: 300/834, loss: 0.29657, lr: 0.469215, top1: 0.65656, throughput: 312.65 | 2022-04-11 05:28:46.140 [rank:3] [train], epoch: 31/50, iter: 300/834, loss: 0.29235, lr: 0.469215, top1: 0.66542, throughput: 312.60 | 2022-04-11 05:28:46.144 [rank:5] [train], epoch: 31/50, iter: 300/834, loss: 0.29590, lr: 0.469215, top1: 0.65745, throughput: 312.51 | 2022-04-11 05:28:46.155 [rank:6] [train], epoch: 31/50, iter: 300/834, loss: 0.29664, lr: 0.469215, top1: 0.65443, throughput: 312.77 | 2022-04-11 05:28:46.159 [rank:2] [train], epoch: 31/50, iter: 300/834, loss: 0.29452, lr: 0.469215, top1: 0.65839, throughput: 312.40 | 2022-04-11 05:28:46.171 [rank:1] [train], epoch: 31/50, iter: 300/834, loss: 0.29404, lr: 0.469215, top1: 0.66073, throughput: 312.35 | 2022-04-11 05:28:46.172 [rank:1] [train], epoch: 31/50, iter: 400/834, loss: 0.29538, lr: 0.463893, top1: 0.65812, throughput: 312.59 | 2022-04-11 05:29:47.594 [rank:2] [train], epoch: 31/50, iter: 400/834, loss: 0.29711, lr: 0.463893, top1: 0.65234, throughput: 312.57 | 2022-04-11 05:29:47.597 [rank:7] [train], epoch: 31/50, iter: 400/834, loss: 0.29434, lr: 0.463893, top1: 0.65922, throughput: 312.16 | 2022-04-11 05:29:47.619 [rank:6] [train], epoch: 31/50, iter: 400/834, loss: 0.29677, lr: 0.463893, top1: 0.65177, throughput: 312.33 | 2022-04-11 05:29:47.631 [rank:0] [train], epoch: 31/50, iter: 400/834, loss: 0.29896, lr: 0.463893, top1: 0.65266, throughput: 312.12 | 2022-04-11 05:29:47.633 [rank:4] [train], epoch: 31/50, iter: 400/834, loss: 0.29484, lr: 0.463893, top1: 0.66219, throughput: 312.19 | 2022-04-11 05:29:47.641 [rank:5] [train], epoch: 31/50, iter: 400/834, loss: 0.29666, lr: 0.463893, top1: 0.65443, throughput: 312.22 | 2022-04-11 05:29:47.651 [rank:3] [train], epoch: 31/50, iter: 400/834, loss: 0.29605, lr: 0.463893, top1: 0.65813, throughput: 312.11 | 2022-04-11 05:29:47.661 [rank:2] [train], epoch: 31/50, iter: 500/834, loss: 0.29838, lr: 0.458589, top1: 0.65417, throughput: 311.48 | 2022-04-11 05:30:49.238 [rank:1] [train], epoch: 31/50, iter: 500/834, loss: 0.29700, lr: 0.458589, top1: 0.65589, throughput: 311.14 | 2022-04-11 05:30:49.302 [rank:5] [train], epoch: 31/50, iter: 500/834, loss: 0.29615, lr: 0.458589, top1: 0.65333, throughput: 311.40 | 2022-04-11 05:30:49.308 [rank:6] [train], epoch: 31/50, iter: 500/834, loss: 0.29740, lr: 0.458589, top1: 0.65354, throughput: 311.24 | 2022-04-11 05:30:49.321 [rank:7] [train], epoch: 31/50, iter: 500/834, loss: 0.29632, lr: 0.458589, top1: 0.66161, throughput: 311.15 | 2022-04-11 05:30:49.326 [rank:0] [train], epoch: 31/50, iter: 500/834, loss: 0.29733, lr: 0.458589, top1: 0.65312, throughput: 311.14 | 2022-04-11 05:30:49.342 [rank:4] [train], epoch: 31/50, iter: 500/834, loss: 0.29436, lr: 0.458589, top1: 0.65698, throughput: 311.11 | 2022-04-11 05:30:49.355 [rank:3] [train], epoch: 31/50, iter: 500/834, loss: 0.29568, lr: 0.458589, top1: 0.65578, throughput: 311.05 | 2022-04-11 05:30:49.387 [rank:0] [train], epoch: 31/50, iter: 600/834, loss: 0.29634, lr: 0.453302, top1: 0.65542, throughput: 314.53 | 2022-04-11 05:31:50.386 [rank:4] [train], epoch: 31/50, iter: 600/834, loss: 0.29339, lr: 0.453302, top1: 0.66313, throughput: 314.59 | 2022-04-11 05:31:50.386 [rank:2] [train], epoch: 31/50, iter: 600/834, loss: 0.29678, lr: 0.453302, top1: 0.65302, throughput: 313.99 | 2022-04-11 05:31:50.388 [rank:1] [train], epoch: 31/50, iter: 600/834, loss: 0.29615, lr: 0.453302, top1: 0.65599, throughput: 314.23 | 2022-04-11 05:31:50.403 [rank:5] [train], epoch: 31/50, iter: 600/834, loss: 0.29548, lr: 0.453302, top1: 0.65833, throughput: 314.26 | 2022-04-11 05:31:50.403 [rank:3] [train], epoch: 31/50, iter: 600/834, loss: 0.29797, lr: 0.453302, top1: 0.65224, throughput: 314.50 | 2022-04-11 05:31:50.437 [rank:7] [train], epoch: 31/50, iter: 600/834, loss: 0.29646, lr: 0.453302, top1: 0.65583, throughput: 314.10 | 2022-04-11 05:31:50.453 [rank:6] [train], epoch: 31/50, iter: 600/834, loss: 0.30029, lr: 0.453302, top1: 0.64734, throughput: 313.99 | 2022-04-11 05:31:50.470 [rank:4] [train], epoch: 31/50, iter: 700/834, loss: 0.29564, lr: 0.448033, top1: 0.65724, throughput: 312.35 | 2022-04-11 05:32:51.856 [rank:1] [train], epoch: 31/50, iter: 700/834, loss: 0.29766, lr: 0.448033, top1: 0.65625, throughput: 312.44 | 2022-04-11 05:32:51.856 [rank:6] [train], epoch: 31/50, iter: 700/834, loss: 0.29461, lr: 0.448033, top1: 0.66490, throughput: 312.68 | 2022-04-11 05:32:51.874 [rank:2] [train], epoch: 31/50, iter: 700/834, loss: 0.29662, lr: 0.448033, top1: 0.65573, throughput: 312.20 | 2022-04-11 05:32:51.887 [rank:0] [train], epoch: 31/50, iter: 700/834, loss: 0.29629, lr: 0.448033, top1: 0.65724, throughput: 312.13 | 2022-04-11 05:32:51.899 [rank:5] [train], epoch: 31/50, iter: 700/834, loss: 0.29600, lr: 0.448033, top1: 0.66120, throughput: 312.19 | 2022-04-11 05:32:51.905 [rank:3] [train], epoch: 31/50, iter: 700/834, loss: 0.29665, lr: 0.448033, top1: 0.65729, throughput: 312.26 | 2022-04-11 05:32:51.925 [rank:7] [train], epoch: 31/50, iter: 700/834, loss: 0.29808, lr: 0.448033, top1: 0.65219, throughput: 312.25 | 2022-04-11 05:32:51.941 [rank:5] [train], epoch: 31/50, iter: 800/834, loss: 0.29379, lr: 0.442783, top1: 0.66245, throughput: 315.92 | 2022-04-11 05:33:52.680 [rank:1] [train], epoch: 31/50, iter: 800/834, loss: 0.29635, lr: 0.442783, top1: 0.65391, throughput: 315.58 | 2022-04-11 05:33:52.695 [rank:6] [train], epoch: 31/50, iter: 800/834, loss: 0.29585, lr: 0.442783, top1: 0.65911, throughput: 315.65 | 2022-04-11 05:33:52.701 [rank:2] [train], epoch: 31/50, iter: 800/834, loss: 0.29643, lr: 0.442783, top1: 0.65417, throughput: 315.67 | 2022-04-11 05:33:52.710 [rank:4] [train], epoch: 31/50, iter: 800/834, loss: 0.29748, lr: 0.442783, top1: 0.65281, throughput: 315.46 | 2022-04-11 05:33:52.720 [rank:0] [train], epoch: 31/50, iter: 800/834, loss: 0.29494, lr: 0.442783, top1: 0.65901, throughput: 315.66 | 2022-04-11 05:33:52.723 [rank:7] [train], epoch: 31/50, iter: 800/834, loss: 0.29658, lr: 0.442783, top1: 0.65531, throughput: 315.81 | 2022-04-11 05:33:52.736 [rank:3] [train], epoch: 31/50, iter: 800/834, loss: 0.29894, lr: 0.442783, top1: 0.65396, throughput: 315.67 | 2022-04-11 05:33:52.748 [rank:5] [train], epoch: 31/50, iter: 834/834, loss: 0.30116, lr: 0.441002, top1: 0.64445, throughput: 309.94 | 2022-04-11 05:34:13.742 [rank:4] [train], epoch: 31/50, iter: 834/834, loss: 0.29515, lr: 0.441002, top1: 0.65962, throughput: 310.39 | 2022-04-11 05:34:13.751 [rank:3] [train], epoch: 31/50, iter: 834/834, loss: 0.29304, lr: 0.441002, top1: 0.66437, throughput: 310.60 | 2022-04-11 05:34:13.765 [rank:2] [train], epoch: 31/50, iter: 834/834, loss: 0.29709, lr: 0.441002, top1: 0.65794, throughput: 310.04[rank:0] [train], epoch: 31/50, iter: 834/834, loss: 0.29564, lr: 0.441002, top1: 0.66207, throughput: 310.23 | 2022-04-11 05:34:13.765 | 2022-04-11 05:34:13.765 [rank:1] [train], epoch: 31/50, iter: 834/834, loss: 0.29674, lr: 0.441002, top1: 0.65656, throughput: 309.81 | 2022-04-11 05:34:13.766 [rank:6] [train], epoch: 31/50, iter: 834/834, loss: 0.29472, lr: 0.441002, top1: 0.65074, throughput: 309.79 | 2022-04-11 05:34:13.773 [rank:7] [train], epoch: 31/50, iter: 834/834, loss: 0.29438, lr: 0.441002, top1: 0.65962, throughput: 309.69 | 2022-04-11 05:34:13.815 [rank:0] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.68176, throughput: 485.06 | 2022-04-11 05:34:26.650 [rank:2] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.66816, throughput: 484.77 | 2022-04-11 05:34:26.658 [rank:1] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.67776, throughput: 484.68 | 2022-04-11 05:34:26.661 [rank:5] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.66336, throughput: 483.33 | 2022-04-11 05:34:26.673 [rank:7] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.67488, throughput: 485.87 | 2022-04-11 05:34:26.679 [rank:3] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.66896, throughput: 483.70 | 2022-04-11 05:34:26.687 [rank:4] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.67648, throughput: 482.75 | 2022-04-11 05:34:26.698 [rank:6] [eval], epoch: 31/50, iter: 125/125, loss: 0.00000, lr: 0.441002, top1: 0.67632, throughput: 483.31 | 2022-04-11 05:34:26.705 [rank:4] [train], epoch: 32/50, iter: 100/834, loss: 0.29298, lr: 0.435776, top1: 0.66578, throughput: 312.65 | 2022-04-11 05:35:28.108 [rank:3] [train], epoch: 32/50, iter: 100/834, loss: 0.28886, lr: 0.435776, top1: 0.67187, throughput: 312.40 | 2022-04-11 05:35:28.145 [rank:5] [train], epoch: 32/50, iter: 100/834, loss: 0.28985, lr: 0.435776, top1: 0.67161, throughput: 312.32 | 2022-04-11 05:35:28.148 [rank:6] [train], epoch: 32/50, iter: 100/834, loss: 0.29383, lr: 0.435776, top1: 0.66281, throughput: 312.40 | 2022-04-11 05:35:28.164 [rank:0] [train], epoch: 32/50, iter: 100/834, loss: 0.29282, lr: 0.435776, top1: 0.66292, throughput: 312.06 | 2022-04-11 05:35:28.177 [rank:1] [train], epoch: 32/50, iter: 100/834, loss: 0.29311, lr: 0.435776, top1: 0.66245, throughput: 312.11 | 2022-04-11 05:35:28.178 [rank:7] [train], epoch: 32/50, iter: 100/834, loss: 0.29346, lr: 0.435776, top1: 0.66604, throughput: 312.19 | 2022-04-11 05:35:28.179 [rank:2] [train], epoch: 32/50, iter: 100/834, loss: 0.29239, lr: 0.435776, top1: 0.66396, throughput: 312.06 | 2022-04-11 05:35:28.186 [rank:4] [train], epoch: 32/50, iter: 200/834, loss: 0.29084, lr: 0.430568, top1: 0.66635, throughput: 311.63 | 2022-04-11 05:36:29.720 [rank:2] [train], epoch: 32/50, iter: 200/834, loss: 0.29506, lr: 0.430568, top1: 0.66125, throughput: 311.83 | 2022-04-11 05:36:29.757 [rank:6] [train], epoch: 32/50, iter: 200/834, loss: 0.29246, lr: 0.430568, top1: 0.66453, throughput: 311.72 | 2022-04-11 05:36:29.758 [rank:1] [train], epoch: 32/50, iter: 200/834, loss: 0.29415, lr: 0.430568, top1: 0.65599, throughput: 311.79 | 2022-04-11 05:36:29.759 [rank:7] [train], epoch: 32/50, iter: 200/834, loss: 0.29380, lr: 0.430568, top1: 0.66099, throughput: 311.72 | 2022-04-11 05:36:29.774 [rank:3] [train], epoch: 32/50, iter: 200/834, loss: 0.29229, lr: 0.430568, top1: 0.66396, throughput: 311.55 | 2022-04-11 05:36:29.774 [rank:5] [train], epoch: 32/50, iter: 200/834, loss: 0.29131, lr: 0.430568, top1: 0.66417, throughput: 311.51 | 2022-04-11 05:36:29.784 [rank:0] [train], epoch: 32/50, iter: 200/834, loss: 0.28756, lr: 0.430568, top1: 0.67354, throughput: 311.61 | 2022-04-11 05:36:29.793 [rank:2] [train], epoch: 32/50, iter: 300/834, loss: 0.29075, lr: 0.425380, top1: 0.66849, throughput: 314.46 | 2022-04-11 05:37:30.815 [rank:5] [train], epoch: 32/50, iter: 300/834, loss: 0.29366, lr: 0.425380, top1: 0.66219, throughput: 314.25 | 2022-04-11 05:37:30.882 [rank:4] [train], epoch: 32/50, iter: 300/834, loss: 0.29175, lr: 0.425380, top1: 0.66724, throughput: 313.90 | 2022-04-11 05:37:30.886 [rank:0] [train], epoch: 32/50, iter: 300/834, loss: 0.29134, lr: 0.425380, top1: 0.66786, throughput: 314.19 | 2022-04-11 05:37:30.903 [rank:1] [train], epoch: 32/50, iter: 300/834, loss: 0.29120, lr: 0.425380, top1: 0.66411, throughput: 313.96 | 2022-04-11 05:37:30.912 [rank:3] [train], epoch: 32/50, iter: 300/834, loss: 0.28908, lr: 0.425380, top1: 0.67427, throughput: 314.04 | 2022-04-11 05:37:30.912 [rank:6] [train], epoch: 32/50, iter: 300/834, loss: 0.29398, lr: 0.425380, top1: 0.65865, throughput: 313.96 | 2022-04-11 05:37:30.913 [rank:7] [train], epoch: 32/50, iter: 300/834, loss: 0.29377, lr: 0.425380, top1: 0.66099, throughput: 314.39 | 2022-04-11 05:37:30.845 [rank:2] [train], epoch: 32/50, iter: 400/834, loss: 0.29111, lr: 0.420212, top1: 0.66505, throughput: 312.82 | 2022-04-11 05:38:32.193 [rank:4] [train], epoch: 32/50, iter: 400/834, loss: 0.29238, lr: 0.420212, top1: 0.66516, throughput: 313.00 | 2022-04-11 05:38:32.228 [rank:3] [train], epoch: 32/50, iter: 400/834, loss: 0.29180, lr: 0.420212, top1: 0.66786, throughput: 313.10 | 2022-04-11 05:38:32.234 [rank:6] [train], epoch: 32/50, iter: 400/834, loss: 0.29318, lr: 0.420212, top1: 0.66203, throughput: 313.09 | 2022-04-11 05:38:32.238 [rank:0] [train], epoch: 32/50, iter: 400/834, loss: 0.29503, lr: 0.420212, top1: 0.65854, throughput: 313.04 | 2022-04-11 05:38:32.237 [rank:7] [train], epoch: 32/50, iter: 400/834, loss: 0.29208, lr: 0.420212, top1: 0.66432, throughput: 312.48 | 2022-04-11 05:38:32.289 [rank:1] [train], epoch: 32/50, iter: 400/834, loss: 0.29549, lr: 0.420212, top1: 0.65917, throughput: 312.79 | 2022-04-11 05:38:32.296 [rank:5] [train], epoch: 32/50, iter: 400/834, loss: 0.29474, lr: 0.420212, top1: 0.66219, throughput: 313.05 | 2022-04-11 05:38:32.215 [rank:2] [train], epoch: 32/50, iter: 500/834, loss: 0.29425, lr: 0.415063, top1: 0.66016, throughput: 313.96 | 2022-04-11 05:39:33.348 [rank:4] [train], epoch: 32/50, iter: 500/834, loss: 0.29130, lr: 0.415063, top1: 0.66771, throughput: 314.07 | 2022-04-11 05:39:33.361 [rank:7] [train], epoch: 32/50, iter: 500/834, loss: 0.29280, lr: 0.415063, top1: 0.66464, throughput: 314.34 | 2022-04-11 05:39:33.369 [rank:3] [train], epoch: 32/50, iter: 500/834, loss: 0.29265, lr: 0.415063, top1: 0.66724, throughput: 313.98 | 2022-04-11 05:39:33.385 [rank:6] [train], epoch: 32/50, iter: 500/834, loss: 0.29424, lr: 0.415063, top1: 0.65948, throughput: 313.99 | 2022-04-11 05:39:33.386 [rank:0] [train], epoch: 32/50, iter: 500/834, loss: 0.29258, lr: 0.415063, top1: 0.66745, throughput: 313.96 | 2022-04-11 05:39:33.392 [rank:5] [train], epoch: 32/50, iter: 500/834, loss: 0.29264, lr: 0.415063, top1: 0.66052, throughput: 313.76 | 2022-04-11 05:39:33.408 [rank:1] [train], epoch: 32/50, iter: 500/834, loss: 0.29056, lr: 0.415063, top1: 0.66766, throughput: 314.58 | 2022-04-11 05:39:33.330 [rank:0] [train], epoch: 32/50, iter: 600/834, loss: 0.29165, lr: 0.409934, top1: 0.66422, throughput: 313.21 | 2022-04-11 05:40:34.692 [rank:5] [train], epoch: 32/50, iter: 600/834, loss: 0.29052, lr: 0.409934, top1: 0.66958, throughput: 313.26 | 2022-04-11 05:40:34.699 [rank:1] [train], epoch: 32/50, iter: 600/834, loss: 0.29248, lr: 0.409934, top1: 0.66094, throughput: 312.78 | 2022-04-11 05:40:34.715 [rank:4] [train], epoch: 32/50, iter: 600/834, loss: 0.29516, lr: 0.409934, top1: 0.65672, throughput: 312.93 | 2022-04-11 05:40:34.716 [rank:2] [train], epoch: 32/50, iter: 600/834, loss: 0.29172, lr: 0.409934, top1: 0.66927, throughput: 312.69 | 2022-04-11 05:40:34.751 [rank:6] [train], epoch: 32/50, iter: 600/834, loss: 0.29303, lr: 0.409934, top1: 0.66438, throughput: 312.86 | 2022-04-11 05:40:34.755 [rank:3] [train], epoch: 32/50, iter: 600/834, loss: 0.28999, lr: 0.409934, top1: 0.66958, throughput: 312.76 | 2022-04-11 05:40:34.774 [rank:7] [train], epoch: 32/50, iter: 600/834, loss: 0.29146, lr: 0.409934, top1: 0.66224, throughput: 312.60 | 2022-04-11 05:40:34.789 [rank:4] [train], epoch: 32/50, iter: 700/834, loss: 0.29443, lr: 0.404826, top1: 0.66104, throughput: 314.61 | 2022-04-11 05:41:35.745 [rank:3] [train], epoch: 32/50, iter: 700/834, loss: 0.29299, lr: 0.404826, top1: 0.66109, throughput: 314.88 | 2022-04-11 05:41:35.749 [rank:7] [train], epoch: 32/50, iter: 700/834, loss: 0.29148, lr: 0.404826, top1: 0.66234, throughput: 314.96 | 2022-04-11 05:41:35.749 [rank:2] [train], epoch: 32/50, iter: 700/834, loss: 0.29254, lr: 0.404826, top1: 0.66635, throughput: 314.71 | 2022-04-11 05:41:35.760 [rank:1] [train], epoch: 32/50, iter: 700/834, loss: 0.29437, lr: 0.404826, top1: 0.66151, throughput: 314.41 | 2022-04-11 05:41:35.782 [rank:5] [train], epoch: 32/50, iter: 700/834, loss: 0.29485, lr: 0.404826, top1: 0.65667, throughput: 314.32 | 2022-04-11 05:41:35.783 [rank:6] [train], epoch: 32/50, iter: 700/834, loss: 0.29410, lr: 0.404826, top1: 0.66057, throughput: 314.54 | 2022-04-11 05:41:35.796 [rank:0] [train], epoch: 32/50, iter: 700/834, loss: 0.29327, lr: 0.404826, top1: 0.66177, throughput: 314.21 | 2022-04-11 05:41:35.798 [rank:5] [train], epoch: 32/50, iter: 800/834, loss: 0.29114, lr: 0.399738, top1: 0.66578, throughput: 313.09 | 2022-04-11 05:42:37.109 [rank:6] [train], epoch: 32/50, iter: 800/834, loss: 0.29214, lr: 0.399738, top1: 0.66286, throughput: 313.14 | 2022-04-11 05:42:37.110 [rank:3] [train], epoch: 32/50, iter: 800/834, loss: 0.29355, lr: 0.399738, top1: 0.66448, throughput: 312.84 | 2022-04-11 05:42:37.121 [rank:4] [train], epoch: 32/50, iter: 800/834, loss: 0.29256, lr: 0.399738, top1: 0.66594, throughput: 312.82 | 2022-04-11 05:42:37.123 [rank:2] [train], epoch: 32/50, iter: 800/834, loss: 0.29226, lr: 0.399738, top1: 0.66130, throughput: 313.26 | 2022-04-11 05:42:37.051 [rank:1] [train], epoch: 32/50, iter: 800/834, loss: 0.29277, lr: 0.399738, top1: 0.66339, throughput: 312.95 | 2022-04-11 05:42:37.133 [rank:0] [train], epoch: 32/50, iter: 800/834, loss: 0.29372, lr: 0.399738, top1: 0.65859, throughput: 313.00 | 2022-04-11 05:42:37.140 [rank:7] [train], epoch: 32/50, iter: 800/834, loss: 0.28892, lr: 0.399738, top1: 0.66677, throughput: 312.55 | 2022-04-11 05:42:37.180 [rank:5] [train], epoch: 32/50, iter: 834/834, loss: 0.29137, lr: 0.398013, top1: 0.66820, throughput: 309.92 | 2022-04-11 05:42:58.172 [rank:2] [train], epoch: 32/50, iter: 834/834, loss: 0.29117, lr: 0.398013, top1: 0.66529, throughput: 308.79 | 2022-04-11 05:42:58.192 [rank:1] [train], epoch: 32/50, iter: 834/834, loss: 0.29380, lr: 0.398013, top1: 0.65977, throughput: 309.92 | 2022-04-11 05:42:58.197 [rank:7] [train], epoch: 32/50, iter: 834/834, loss: 0.29216, lr: 0.398013, top1: 0.66376, throughput: 310.49 | 2022-04-11 05:42:58.205 [rank:4] [train], epoch: 32/50, iter: 834/834, loss: 0.29476, lr: 0.398013, top1: 0.65717, throughput: 309.28 | 2022-04-11 05:42:58.230 [rank:3] [train], epoch: 32/50, iter: 834/834, loss: 0.29573, lr: 0.398013, top1: 0.66330, throughput: 309.25 | 2022-04-11 05:42:58.230 [rank:0] [train], epoch: 32/50, iter: 834/834, loss: 0.29308, lr: 0.398013, top1: 0.67249, throughput: 309.44 | 2022-04-11 05:42:58.236 [rank:6] [train], epoch: 32/50, iter: 834/834, loss: 0.29602, lr: 0.398013, top1: 0.66498, throughput: 308.72 | 2022-04-11 05:42:58.256 [rank:0] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.68688, throughput: 481.87 | 2022-04-11 05:43:11.206 [rank:1] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.67968, throughput: 480.31 | 2022-04-11 05:43:11.209 [rank:2] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.67856, throughput: 479.84 | 2022-04-11 05:43:11.217 [rank:5] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.67600, throughput: 478.71 | 2022-04-11 05:43:11.228 [rank:7] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.68096, throughput: 479.90 | 2022-04-11 05:43:11.229 [rank:4] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.67728, throughput: 480.27 | 2022-04-11 05:43:11.243 [rank:3] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.67344, throughput: 480.22 | 2022-04-11 05:43:11.245 [rank:6] [eval], epoch: 32/50, iter: 125/125, loss: 0.00000, lr: 0.398013, top1: 0.68400, throughput: 481.12 | 2022-04-11 05:43:11.247 [rank:7] [train], epoch: 33/50, iter: 100/834, loss: 0.28909, lr: 0.392953, top1: 0.66661, throughput: 313.80 | 2022-04-11 05:44:12.414 [rank:5] [train], epoch: 33/50, iter: 100/834, loss: 0.28476, lr: 0.392953, top1: 0.68229, throughput: 313.71 | 2022-04-11 05:44:12.431 [rank:6] [train], epoch: 33/50, iter: 100/834, loss: 0.28639, lr: 0.392953, top1: 0.67380, throughput: 313.76 | 2022-04-11 05:44:12.440 [rank:2] [train], epoch: 33/50, iter: 100/834, loss: 0.28618, lr: 0.392953, top1: 0.67943, throughput: 313.48 | 2022-04-11 05:44:12.465 [rank:4] [train], epoch: 33/50, iter: 100/834, loss: 0.28829, lr: 0.392953, top1: 0.67792, throughput: 313.61 | 2022-04-11 05:44:12.465 [rank:3] [train], epoch: 33/50, iter: 100/834, loss: 0.28438, lr: 0.392953, top1: 0.68146, throughput: 313.51 | 2022-04-11 05:44:12.487 [rank:0] [train], epoch: 33/50, iter: 100/834, loss: 0.28619, lr: 0.392953, top1: 0.67234, throughput: 313.21 | 2022-04-11 05:44:12.508 [rank:1] [train], epoch: 33/50, iter: 100/834, loss: 0.28434, lr: 0.392953, top1: 0.68260, throughput: 313.63 | 2022-04-11 05:44:12.427 [rank:5] [train], epoch: 33/50, iter: 200/834, loss: 0.28906, lr: 0.387915, top1: 0.67182, throughput: 312.29 | 2022-04-11 05:45:13.912 [rank:2] [train], epoch: 33/50, iter: 200/834, loss: 0.29129, lr: 0.387915, top1: 0.66781, throughput: 312.40 | 2022-04-11 05:45:13.924 [rank:1] [train], epoch: 33/50, iter: 200/834, loss: 0.28455, lr: 0.387915, top1: 0.68417, throughput: 312.17 | 2022-04-11 05:45:13.933 [rank:0] [train], epoch: 33/50, iter: 200/834, loss: 0.28790, lr: 0.387915, top1: 0.67130, throughput: 312.43 | 2022-04-11 05:45:13.962 [rank:4] [train], epoch: 33/50, iter: 200/834, loss: 0.28631, lr: 0.387915, top1: 0.67687, throughput: 312.17 | 2022-04-11 05:45:13.969 [rank:6] [train], epoch: 33/50, iter: 200/834, loss: 0.28983, lr: 0.387915, top1: 0.66969, throughput: 311.99 | 2022-04-11 05:45:13.980 [rank:7] [train], epoch: 33/50, iter: 200/834, loss: 0.28638, lr: 0.387915, top1: 0.67589, throughput: 311.72 | 2022-04-11 05:45:14.007 [rank:3] [train], epoch: 33/50, iter: 200/834, loss: 0.28802, lr: 0.387915, top1: 0.67161, throughput: 311.97 | 2022-04-11 05:45:14.032 [rank:2] [train], epoch: 33/50, iter: 300/834, loss: 0.28765, lr: 0.382898, top1: 0.67161, throughput: 314.01 | 2022-04-11 05:46:15.068 [rank:5] [train], epoch: 33/50, iter: 300/834, loss: 0.28470, lr: 0.382898, top1: 0.68057, throughput: 313.86 | 2022-04-11 05:46:15.087 [rank:3] [train], epoch: 33/50, iter: 300/834, loss: 0.28648, lr: 0.382898, top1: 0.66974, throughput: 314.46 | 2022-04-11 05:46:15.089 [rank:0] [train], epoch: 33/50, iter: 300/834, loss: 0.28725, lr: 0.382898, top1: 0.66995, throughput: 314.07 | 2022-04-11 05:46:15.096 [rank:1] [train], epoch: 33/50, iter: 300/834, loss: 0.28748, lr: 0.382898, top1: 0.67505, throughput: 313.88 | 2022-04-11 05:46:15.102 [rank:6] [train], epoch: 33/50, iter: 300/834, loss: 0.28716, lr: 0.382898, top1: 0.67755, throughput: 314.11 | 2022-04-11 05:46:15.106 [rank:4] [train], epoch: 33/50, iter: 300/834, loss: 0.29036, lr: 0.382898, top1: 0.67245, throughput: 314.04 | 2022-04-11 05:46:15.108 [rank:7] [train], epoch: 33/50, iter: 300/834, loss: 0.29149, lr: 0.382898, top1: 0.66740, throughput: 313.95 | 2022-04-11 05:46:15.163 [rank:5] [train], epoch: 33/50, iter: 400/834, loss: 0.28923, lr: 0.377903, top1: 0.67292, throughput: 313.63 | 2022-04-11 05:47:16.305 [rank:0] [train], epoch: 33/50, iter: 400/834, loss: 0.28758, lr: 0.377903, top1: 0.67708, throughput: 313.43 | 2022-04-11 05:47:16.354 [rank:3] [train], epoch: 33/50, iter: 400/834, loss: 0.28919, lr: 0.377903, top1: 0.66828, throughput: 313.34 | 2022-04-11 05:47:16.365 [rank:6] [train], epoch: 33/50, iter: 400/834, loss: 0.28894, lr: 0.377903, top1: 0.67141, throughput: 313.42 | 2022-04-11 05:47:16.366 [rank:1] [train], epoch: 33/50, iter: 400/834, loss: 0.28606, lr: 0.377903, top1: 0.67615, throughput: 313.37 | 2022-04-11 05:47:16.372 [rank:2] [train], epoch: 33/50, iter: 400/834, loss: 0.28918, lr: 0.377903, top1: 0.67193, throughput: 313.19 | 2022-04-11 05:47:16.373 [rank:4] [train], epoch: 33/50, iter: 400/834, loss: 0.29035, lr: 0.377903, top1: 0.66833, throughput: 313.32 | 2022-04-11 05:47:16.386 [rank:7] [train], epoch: 33/50, iter: 400/834, loss: 0.29075, lr: 0.377903, top1: 0.66641, throughput: 313.98 | 2022-04-11 05:47:16.313 [rank:0] [train], epoch: 33/50, iter: 500/834, loss: 0.28885, lr: 0.372930, top1: 0.66828, throughput: 313.90 | 2022-04-11 05:48:17.520 [rank:6] [train], epoch: 33/50, iter: 500/834, loss: 0.28675, lr: 0.372930, top1: 0.67427, throughput: 313.90 | 2022-04-11 05:48:17.531 [rank:4] [train], epoch: 33/50, iter: 500/834, loss: 0.28810, lr: 0.372930, top1: 0.67042, throughput: 313.96 | 2022-04-11 05:48:17.541 [rank:5] [train], epoch: 33/50, iter: 500/834, loss: 0.28971, lr: 0.372930, top1: 0.66589, throughput: 313.55 | 2022-04-11 05:48:17.541 [rank:7] [train], epoch: 33/50, iter: 500/834, loss: 0.28964, lr: 0.372930, top1: 0.66635, throughput: 313.50 | 2022-04-11 05:48:17.557 [rank:3] [train], epoch: 33/50, iter: 500/834, loss: 0.28995, lr: 0.372930, top1: 0.66839, throughput: 313.73 | 2022-04-11 05:48:17.564 [rank:2] [train], epoch: 33/50, iter: 500/834, loss: 0.28952, lr: 0.372930, top1: 0.66797, throughput: 313.69 | 2022-04-11 05:48:17.580 [rank:1] [train], epoch: 33/50, iter: 500/834, loss: 0.28915, lr: 0.372930, top1: 0.67193, throughput: 313.62 | 2022-04-11 05:48:17.593 [rank:6] [train], epoch: 33/50, iter: 600/834, loss: 0.28732, lr: 0.367980, top1: 0.67380, throughput: 311.50 | 2022-04-11 05:49:19.170 [rank:2] [train], epoch: 33/50, iter: 600/834, loss: 0.28532, lr: 0.367980, top1: 0.68177, throughput: 311.68 | 2022-04-11 05:49:19.181 [rank:0] [train], epoch: 33/50, iter: 600/834, loss: 0.28682, lr: 0.367980, top1: 0.67609, throughput: 311.33 | 2022-04-11 05:49:19.191 [rank:7] [train], epoch: 33/50, iter: 600/834, loss: 0.28690, lr: 0.367980, top1: 0.67771, throughput: 311.46 | 2022-04-11 05:49:19.202 [rank:4] [train], epoch: 33/50, iter: 600/834, loss: 0.28757, lr: 0.367980, top1: 0.67208, throughput: 311.37 | 2022-04-11 05:49:19.204 [rank:3] [train], epoch: 33/50, iter: 600/834, loss: 0.29167, lr: 0.367980, top1: 0.66677, throughput: 311.46 | 2022-04-11 05:49:19.209 [rank:1] [train], epoch: 33/50, iter: 600/834, loss: 0.28834, lr: 0.367980, top1: 0.67125, throughput: 311.57 | 2022-04-11 05:49:19.216 [rank:5] [train], epoch: 33/50, iter: 600/834, loss: 0.28943, lr: 0.367980, top1: 0.67073, throughput: 311.59 | 2022-04-11 05:49:19.161 [rank:5] [train], epoch: 33/50, iter: 700/834, loss: 0.28906, lr: 0.363052, top1: 0.67057, throughput: 313.20 | 2022-04-11 05:50:20.464 [rank:7] [train], epoch: 33/50, iter: 700/834, loss: 0.28995, lr: 0.363052, top1: 0.66474, throughput: 313.22 | 2022-04-11 05:50:20.501 [rank:0] [train], epoch: 33/50, iter: 700/834, loss: 0.28849, lr: 0.363052, top1: 0.66932, throughput: 313.11 | 2022-04-11 05:50:20.511 [rank:3] [train], epoch: 33/50, iter: 700/834, loss: 0.28980, lr: 0.363052, top1: 0.66813, throughput: 313.19 | 2022-04-11 05:50:20.515 [rank:4] [train], epoch: 33/50, iter: 700/834, loss: 0.29004, lr: 0.363052, top1: 0.66755, throughput: 313.13 | 2022-04-11 05:50:20.521 [rank:1] [train], epoch: 33/50, iter: 700/834, loss: 0.28996, lr: 0.363052, top1: 0.66844, throughput: 313.18 | 2022-04-11 05:50:20.524 [rank:6] [train], epoch: 33/50, iter: 700/834, loss: 0.29053, lr: 0.363052, top1: 0.66802, throughput: 312.89 | 2022-04-11 05:50:20.533 [rank:2] [train], epoch: 33/50, iter: 700/834, loss: 0.28901, lr: 0.363052, top1: 0.66974, throughput: 312.84 | 2022-04-11 05:50:20.555 [rank:4] [train], epoch: 33/50, iter: 800/834, loss: 0.28900, lr: 0.358147, top1: 0.66875, throughput: 314.11 | 2022-04-11 05:51:21.646 [rank:6] [train], epoch: 33/50, iter: 800/834, loss: 0.28690, lr: 0.358147, top1: 0.67505, throughput: 314.16 | 2022-04-11 05:51:21.649 [rank:1] [train], epoch: 33/50, iter: 800/834, loss: 0.29023, lr: 0.358147, top1: 0.66688, throughput: 314.05 | 2022-04-11 05:51:21.661 [rank:3] [train], epoch: 33/50, iter: 800/834, loss: 0.28987, lr: 0.358147, top1: 0.66844, throughput: 313.90 | 2022-04-11 05:51:21.680 [rank:2] [train], epoch: 33/50, iter: 800/834, loss: 0.29079, lr: 0.358147, top1: 0.66547, throughput: 314.06 | 2022-04-11 05:51:21.690 [rank:5] [train], epoch: 33/50, iter: 800/834, loss: 0.28876, lr: 0.358147, top1: 0.67115, throughput: 313.54 | 2022-04-11 05:51:21.699 [rank:0] [train], epoch: 33/50, iter: 800/834, loss: 0.28942, lr: 0.358147, top1: 0.66750, throughput: 314.10 | 2022-04-11 05:51:21.637 [rank:7] [train], epoch: 33/50, iter: 800/834, loss: 0.28905, lr: 0.358147, top1: 0.66896, throughput: 313.70 | 2022-04-11 05:51:21.706 [rank:5] [train], epoch: 33/50, iter: 834/834, loss: 0.29139, lr: 0.356485, top1: 0.66544, throughput: 312.42 | 2022-04-11 05:51:42.594 [rank:7] [train], epoch: 33/50, iter: 834/834, loss: 0.28375, lr: 0.356485, top1: 0.67984, throughput: 312.41 | 2022-04-11 05:51:42.602 [rank:6] [train], epoch: 33/50, iter: 834/834, loss: 0.28850, lr: 0.356485, top1: 0.67433, throughput: 311.53 | 2022-04-11 05:51:42.603 [rank:1] [train], epoch: 33/50, iter: 834/834, loss: 0.29318, lr: 0.356485, top1: 0.65763, throughput: 311.71 | 2022-04-11 05:51:42.603 [rank:3] [train], epoch: 33/50, iter: 834/834, loss: 0.28960, lr: 0.356485, top1: 0.66896, throughput: 311.98 | 2022-04-11 05:51:42.604 [rank:4] [train], epoch: 33/50, iter: 834/834, loss: 0.29189, lr: 0.356485, top1: 0.66881, throughput: 311.47 | 2022-04-11 05:51:42.605 [rank:0] [train], epoch: 33/50, iter: 834/834, loss: 0.29340, lr: 0.356485, top1: 0.66284, throughput: 310.93 | 2022-04-11 05:51:42.633 [rank:2] [train], epoch: 33/50, iter: 834/834, loss: 0.29161, lr: 0.356485, top1: 0.66054, throughput: 311.48 | 2022-04-11 05:51:42.648 [rank:0] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.68400, throughput: 487.38 | 2022-04-11 05:51:55.456 [rank:1] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.68016, throughput: 485.98 | 2022-04-11 05:51:55.464 [rank:2] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.67376, throughput: 487.55 | 2022-04-11 05:51:55.467 [rank:5] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.67152, throughput: 485.27 | 2022-04-11 05:51:55.473 [rank:7] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.66928, throughput: 485.49 | 2022-04-11 05:51:55.476 [rank:3] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.67504, throughput: 484.58 | 2022-04-11 05:51:55.502 [rank:4] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.67344, throughput: 484.47 | 2022-04-11 05:51:55.505 [rank:6] [eval], epoch: 33/50, iter: 125/125, loss: 0.00000, lr: 0.356485, top1: 0.67920, throughput: 484.37 | 2022-04-11 05:51:55.506 [rank:2] [train], epoch: 34/50, iter: 100/834, loss: 0.28449, lr: 0.351612, top1: 0.68354, throughput: 313.16 | 2022-04-11 05:52:56.777 [rank:5] [train], epoch: 34/50, iter: 100/834, loss: 0.28475, lr: 0.351612, top1: 0.67776, throughput: 313.17 | 2022-04-11 05:52:56.782 [rank:1] [train], epoch: 34/50, iter: 100/834, loss: 0.28312, lr: 0.351612, top1: 0.68281, throughput: 313.07 | 2022-04-11 05:52:56.793 [rank:7] [train], epoch: 34/50, iter: 100/834, loss: 0.27948, lr: 0.351612, top1: 0.68646, throughput: 313.05 | 2022-04-11 05:52:56.807 [rank:6] [train], epoch: 34/50, iter: 100/834, loss: 0.28684, lr: 0.351612, top1: 0.67318, throughput: 313.14 | 2022-04-11 05:52:56.822 [rank:4] [train], epoch: 34/50, iter: 100/834, loss: 0.28526, lr: 0.351612, top1: 0.67969, throughput: 313.13 | 2022-04-11 05:52:56.822 [rank:0] [train], epoch: 34/50, iter: 100/834, loss: 0.28221, lr: 0.351612, top1: 0.68766, throughput: 312.88 | 2022-04-11 05:52:56.822 [rank:3] [train], epoch: 34/50, iter: 100/834, loss: 0.27996, lr: 0.351612, top1: 0.68750, throughput: 313.37 | 2022-04-11 05:52:56.771 [rank:6] [train], epoch: 34/50, iter: 200/834, loss: 0.28311, lr: 0.346762, top1: 0.68057, throughput: 313.40 | 2022-04-11 05:53:58.084 [rank:2] [train], epoch: 34/50, iter: 200/834, loss: 0.28295, lr: 0.346762, top1: 0.68120, throughput: 313.06 | 2022-04-11 05:53:58.108 [rank:5] [train], epoch: 34/50, iter: 200/834, loss: 0.28281, lr: 0.346762, top1: 0.68297, throughput: 312.89 | 2022-04-11 05:53:58.145 [rank:1] [train], epoch: 34/50, iter: 200/834, loss: 0.28382, lr: 0.346762, top1: 0.67891, throughput: 312.92 [rank:4] [train], epoch: 34/50, iter: 200/834, loss: 0.28324, lr: 0.346762, top1: 0.67891, throughput: 313.06| 2022-04-11 05:53:58.151 | 2022-04-11 05:53:58.152 [rank:0] [train], epoch: 34/50, iter: 200/834, loss: 0.28350, lr: 0.346762, top1: 0.67948, throughput: 313.06 | 2022-04-11 05:53:58.152 [rank:7] [train], epoch: 34/50, iter: 200/834, loss: 0.28035, lr: 0.346762, top1: 0.68714, throughput: 312.92 | 2022-04-11 05:53:58.165 [rank:3] [train], epoch: 34/50, iter: 200/834, loss: 0.28270, lr: 0.346762, top1: 0.68135, throughput: 312.56 | 2022-04-11 05:53:58.199 [rank:5] [train], epoch: 34/50, iter: 300/834, loss: 0.28322, lr: 0.341936, top1: 0.68365, throughput: 312.53 | 2022-04-11 05:54:59.579 [rank:0] [train], epoch: 34/50, iter: 300/834, loss: 0.28141, lr: 0.341936, top1: 0.68625, throughput: 312.44 | 2022-04-11 05:54:59.603 [rank:7] [train], epoch: 34/50, iter: 300/834, loss: 0.28261, lr: 0.341936, top1: 0.68635, throughput: 312.43 | 2022-04-11 05:54:59.618 [rank:4] [train], epoch: 34/50, iter: 300/834, loss: 0.28628, lr: 0.341936, top1: 0.67490, throughput: 312.36 | 2022-04-11 05:54:59.619 [rank:6] [train], epoch: 34/50, iter: 300/834, loss: 0.28425, lr: 0.341936, top1: 0.67984, throughput: 312.01 | 2022-04-11 05:54:59.620 [rank:1] [train], epoch: 34/50, iter: 300/834, loss: 0.28537, lr: 0.341936, top1: 0.67990, throughput: 312.28 | 2022-04-11 05:54:59.634 [rank:3] [train], epoch: 34/50, iter: 300/834, loss: 0.28535, lr: 0.341936, top1: 0.68161, throughput: 312.41 | 2022-04-11 05:54:59.656 [rank:2] [train], epoch: 34/50, iter: 300/834, loss: 0.28532, lr: 0.341936, top1: 0.67755, throughput: 311.92 | 2022-04-11 05:54:59.662 [rank:4] [train], epoch: 34/50, iter: 400/834, loss: 0.28692, lr: 0.337134, top1: 0.67354, throughput: 313.47 | 2022-04-11 05:56:00.869 [rank:1] [train], epoch: 34/50, iter: 400/834, loss: 0.28652, lr: 0.337134, top1: 0.67552, throughput: 313.53 | 2022-04-11 05:56:00.872 [rank:3] [train], epoch: 34/50, iter: 400/834, loss: 0.28439, lr: 0.337134, top1: 0.68224, throughput: 313.61 | 2022-04-11 05:56:00.879 [rank:6] [train], epoch: 34/50, iter: 400/834, loss: 0.28546, lr: 0.337134, top1: 0.67500, throughput: 313.21 | 2022-04-11 05:56:00.920 [rank:5] [train], epoch: 34/50, iter: 400/834, loss: 0.28560, lr: 0.337134, top1: 0.67875, throughput: 313.40 | 2022-04-11 05:56:00.842 [rank:0] [train], epoch: 34/50, iter: 400/834, loss: 0.28712, lr: 0.337134, top1: 0.67609, throughput: 313.04 | 2022-04-11 05:56:00.938 [rank:7] [train], epoch: 34/50, iter: 400/834, loss: 0.28551, lr: 0.337134, top1: 0.67677, throughput: 313.10 | 2022-04-11 05:56:00.940 [rank:2] [train], epoch: 34/50, iter: 400/834, loss: 0.28742, lr: 0.337134, top1: 0.67135, throughput: 313.25 | 2022-04-11 05:56:00.955 [rank:2] [train], epoch: 34/50, iter: 500/834, loss: 0.28376, lr: 0.332357, top1: 0.68245, throughput: 311.77 | 2022-04-11 05:57:02.538 [rank:6] [train], epoch: 34/50, iter: 500/834, loss: 0.28520, lr: 0.332357, top1: 0.67859, throughput: 311.60 | 2022-04-11 05:57:02.539 [rank:3] [train], epoch: 34/50, iter: 500/834, loss: 0.28425, lr: 0.332357, top1: 0.68193, throughput: 311.38 | 2022-04-11 05:57:02.539 [rank:4] [train], epoch: 34/50, iter: 500/834, loss: 0.28496, lr: 0.332357, top1: 0.67823, throughput: 311.16 | 2022-04-11 05:57:02.572 [rank:1] [train], epoch: 34/50, iter: 500/834, loss: 0.28300, lr: 0.332357, top1: 0.68021, throughput: 311.14 | 2022-04-11 05:57:02.582 [rank:5] [train], epoch: 34/50, iter: 500/834, loss: 0.28296, lr: 0.332357, top1: 0.68286, throughput: 310.94 | 2022-04-11 05:57:02.591 [rank:7] [train], epoch: 34/50, iter: 500/834, loss: 0.28399, lr: 0.332357, top1: 0.68026, throughput: 311.41 | 2022-04-11 05:57:02.594 [rank:0] [train], epoch: 34/50, iter: 500/834, loss: 0.28674, lr: 0.332357, top1: 0.67255, throughput: 311.29 | 2022-04-11 05:57:02.617 [rank:5] [train], epoch: 34/50, iter: 600/834, loss: 0.28384, lr: 0.327604, top1: 0.67938, throughput: 315.32 | 2022-04-11 05:58:03.482 [rank:1] [train], epoch: 34/50, iter: 600/834, loss: 0.28387, lr: 0.327604, top1: 0.68177, throughput: 315.18 | 2022-04-11 05:58:03.499 [rank:3] [train], epoch: 34/50, iter: 600/834, loss: 0.28392, lr: 0.327604, top1: 0.68312, throughput: 314.94 | 2022-04-11 05:58:03.503 [rank:2] [train], epoch: 34/50, iter: 600/834, loss: 0.28669, lr: 0.327604, top1: 0.67682, throughput: 314.86 | 2022-04-11 05:58:03.518 [rank:4] [train], epoch: 34/50, iter: 600/834, loss: 0.28360, lr: 0.327604, top1: 0.67719, throughput: 314.98 | 2022-04-11 05:58:03.528 [rank:6] [train], epoch: 34/50, iter: 600/834, loss: 0.28272, lr: 0.327604, top1: 0.68536, throughput: 314.81 | 2022-04-11 05:58:03.528 [rank:7] [train], epoch: 34/50, iter: 600/834, loss: 0.28629, lr: 0.327604, top1: 0.67771, throughput: 314.98 | 2022-04-11 05:58:03.551 [rank:0] [train], epoch: 34/50, iter: 600/834, loss: 0.28532, lr: 0.327604, top1: 0.67813, throughput: 315.06 | 2022-04-11 05:58:03.558 [rank:4] [train], epoch: 34/50, iter: 700/834, loss: 0.28632, lr: 0.322876, top1: 0.67500, throughput: 312.41 | 2022-04-11 05:59:04.986 [rank:6] [train], epoch: 34/50, iter: 700/834, loss: 0.28536, lr: 0.322876, top1: 0.67833, throughput: 312.16 | 2022-04-11 05:59:05.035 [rank:3] [train], epoch: 34/50, iter: 700/834, loss: 0.28511, lr: 0.322876, top1: 0.67875, throughput: 311.83 | 2022-04-11 05:59:05.076 [rank:7] [train], epoch: 34/50, iter: 700/834, loss: 0.28237, lr: 0.322876, top1: 0.68521, throughput: 312.06 | 2022-04-11 05:59:05.077 [rank:5] [train], epoch: 34/50, iter: 700/834, loss: 0.28421, lr: 0.322876, top1: 0.67854, throughput: 311.70 | 2022-04-11 05:59:05.079 [rank:2] [train], epoch: 34/50, iter: 700/834, loss: 0.28355, lr: 0.322876, top1: 0.68042, throughput: 312.18 | 2022-04-11 05:59:05.021 [rank:0] [train], epoch: 34/50, iter: 700/834, loss: 0.28535, lr: 0.322876, top1: 0.68078, throughput: 311.88 | 2022-04-11 05:59:05.119 [rank:1] [train], epoch: 34/50, iter: 700/834, loss: 0.28392, lr: 0.322876, top1: 0.67792, throughput: 312.08 | 2022-04-11 05:59:05.022 [rank:7] [train], epoch: 34/50, iter: 800/834, loss: 0.28580, lr: 0.318174, top1: 0.67490, throughput: 312.95 | 2022-04-11 06:00:06.429 [rank:2] [train], epoch: 34/50, iter: 800/834, loss: 0.28473, lr: 0.318174, top1: 0.68078, throughput: 312.62 | 2022-04-11 06:00:06.438 [rank:5] [train], epoch: 34/50, iter: 800/834, loss: 0.28417, lr: 0.318174, top1: 0.67896, throughput: 312.90 | 2022-04-11 06:00:06.441 [rank:1] [train], epoch: 34/50, iter: 800/834, loss: 0.28455, lr: 0.318174, top1: 0.68057, throughput: 312.58 | 2022-04-11 06:00:06.446 [rank:4] [train], epoch: 34/50, iter: 800/834, loss: 0.28439, lr: 0.318174, top1: 0.67641, throughput: 312.39 | 2022-04-11 06:00:06.447 [rank:6] [train], epoch: 34/50, iter: 800/834, loss: 0.28532, lr: 0.318174, top1: 0.67411, throughput: 312.56 | 2022-04-11 06:00:06.463 [rank:0] [train], epoch: 34/50, iter: 800/834, loss: 0.28408, lr: 0.318174, top1: 0.68443, throughput: 312.85 | 2022-04-11 06:00:06.491 [rank:3] [train], epoch: 34/50, iter: 800/834, loss: 0.28324, lr: 0.318174, top1: 0.68120, throughput: 312.57 | 2022-04-11 06:00:06.502 [rank:5] [train], epoch: 34/50, iter: 834/834, loss: 0.28369, lr: 0.316581, top1: 0.68582, throughput: 312.56 | 2022-04-11 06:00:27.327 [rank:7] [train], epoch: 34/50, iter: 834/834, loss: 0.28444, lr: 0.316581, top1: 0.67525, throughput: 312.19 | 2022-04-11 06:00:27.339 [rank:1] [train], epoch: 34/50, iter: 834/834, loss: 0.28341, lr: 0.316581, top1: 0.68183, throughput: 312.44 | 2022-04-11 06:00:27.340 [rank:6] [train], epoch: 34/50, iter: 834/834, loss: 0.28211, lr: 0.316581, top1: 0.67984, throughput: 312.67 | 2022-04-11 06:00:27.341 [rank:0] [train], epoch: 34/50, iter: 834/834, loss: 0.28668, lr: 0.316581, top1: 0.67570, throughput: 313.07 | 2022-04-11 06:00:27.343 [rank:3] [train], epoch: 34/50, iter: 834/834, loss: 0.28596, lr: 0.316581, top1: 0.67402, throughput: 313.00 | 2022-04-11 06:00:27.358 [rank:4] [train], epoch: 34/50, iter: 834/834, loss: 0.28241, lr: 0.316581, top1: 0.68949, throughput: 312.01 | 2022-04-11 06:00:27.369 [rank:2] [train], epoch: 34/50, iter: 834/834, loss: 0.28382, lr: 0.316581, top1: 0.67739, throughput: 311.66 | 2022-04-11 06:00:27.384 [rank:0] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.69344, throughput: 483.57 | 2022-04-11 06:00:40.268 [rank:1] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.69088, throughput: 483.04 | 2022-04-11 06:00:40.278 [rank:2] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.68064, throughput: 484.58 | 2022-04-11 06:00:40.281 [rank:7] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.69216, throughput: 482.75 | 2022-04-11 06:00:40.286 [rank:5] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.69008, throughput: 482.22 | 2022-04-11 06:00:40.288 [rank:6] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.68928, throughput: 482.36 | 2022-04-11 06:00:40.298 [rank:4] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.68368, throughput: 482.72 | 2022-04-11 06:00:40.316 [rank:3] [eval], epoch: 34/50, iter: 125/125, loss: 0.00000, lr: 0.316581, top1: 0.68960, throughput: 482.09 | 2022-04-11 06:00:40.322 [rank:6] [train], epoch: 35/50, iter: 100/834, loss: 0.27840, lr: 0.311913, top1: 0.69318, throughput: 313.98 | 2022-04-11 06:01:41.447 [rank:5] [train], epoch: 35/50, iter: 100/834, loss: 0.27858, lr: 0.311913, top1: 0.69016, throughput: 313.91 | 2022-04-11 06:01:41.451 [rank:7] [train], epoch: 35/50, iter: 100/834, loss: 0.27859, lr: 0.311913, top1: 0.69141, throughput: 313.83 | 2022-04-11 06:01:41.465 [rank:2] [train], epoch: 35/50, iter: 100/834, loss: 0.28055, lr: 0.311913, top1: 0.68885, throughput: 313.80 | 2022-04-11 06:01:41.466 [rank:0] [train], epoch: 35/50, iter: 100/834, loss: 0.27663, lr: 0.311913, top1: 0.69589, throughput: 313.45 | 2022-04-11 06:01:41.521 [rank:1] [train], epoch: 35/50, iter: 100/834, loss: 0.27819, lr: 0.311913, top1: 0.69354, throughput: 313.48 | 2022-04-11 06:01:41.526 [rank:3] [train], epoch: 35/50, iter: 100/834, loss: 0.28174, lr: 0.311913, top1: 0.68776, throughput: 313.55 | 2022-04-11 06:01:41.556 [rank:4] [train], epoch: 35/50, iter: 100/834, loss: 0.27716, lr: 0.311913, top1: 0.69479, throughput: 313.41 | 2022-04-11 06:01:41.577 [rank:6] [train], epoch: 35/50, iter: 200/834, loss: 0.27767, lr: 0.307271, top1: 0.69391, throughput: 312.12 | 2022-04-11 06:02:42.962 [rank:7] [train], epoch: 35/50, iter: 200/834, loss: 0.28152, lr: 0.307271, top1: 0.68578, throughput: 312.18 | 2022-04-11 06:02:42.969 [rank:5] [train], epoch: 35/50, iter: 200/834, loss: 0.27849, lr: 0.307271, top1: 0.69109, throughput: 312.10 | 2022-04-11 06:02:42.970 [rank:0] [train], epoch: 35/50, iter: 200/834, loss: 0.28054, lr: 0.307271, top1: 0.68833, throughput: 312.45 | 2022-04-11 06:02:42.971 [rank:4] [train], epoch: 35/50, iter: 200/834, loss: 0.27787, lr: 0.307271, top1: 0.69182, throughput: 312.57 | 2022-04-11 06:02:43.003 [rank:1] [train], epoch: 35/50, iter: 200/834, loss: 0.28154, lr: 0.307271, top1: 0.68865, throughput: 312.21 | 2022-04-11 06:02:43.024 [rank:3] [train], epoch: 35/50, iter: 200/834, loss: 0.28002, lr: 0.307271, top1: 0.69135, throughput: 312.32 | 2022-04-11 06:02:43.030 [rank:2] [train], epoch: 35/50, iter: 200/834, loss: 0.28107, lr: 0.307271, top1: 0.68302, throughput: 311.82 | 2022-04-11 06:02:43.040 [rank:4] [train], epoch: 35/50, iter: 300/834, loss: 0.27992, lr: 0.302655, top1: 0.68464, throughput: 313.54 | 2022-04-11 06:03:44.239 [rank:7] [train], epoch: 35/50, iter: 300/834, loss: 0.28245, lr: 0.302655, top1: 0.68474, throughput: 313.15 | 2022-04-11 06:03:44.282 [rank:0] [train], epoch: 35/50, iter: 300/834, loss: 0.28056, lr: 0.302655, top1: 0.68266, throughput: 313.15 | 2022-04-11 06:03:44.284 [rank:6] [train], epoch: 35/50, iter: 300/834, loss: 0.27918, lr: 0.302655, top1: 0.68917, throughput: 313.04 | 2022-04-11 06:03:44.295 [rank:2] [train], epoch: 35/50, iter: 300/834, loss: 0.28062, lr: 0.302655, top1: 0.68594, throughput: 313.32 | 2022-04-11 06:03:44.319 [rank:5] [train], epoch: 35/50, iter: 300/834, loss: 0.28032, lr: 0.302655, top1: 0.68943, throughput: 312.93 | 2022-04-11 06:03:44.326 [rank:3] [train], epoch: 35/50, iter: 300/834, loss: 0.27972, lr: 0.302655, top1: 0.68849, throughput: 313.19 | 2022-04-11 06:03:44.335 [rank:1] [train], epoch: 35/50, iter: 300/834, loss: 0.28308, lr: 0.302655, top1: 0.67859, throughput: 313.15 | 2022-04-11 06:03:44.336 [rank:2] [train], epoch: 35/50, iter: 400/834, loss: 0.28166, lr: 0.298065, top1: 0.68391, throughput: 315.67 | 2022-04-11 06:04:45.143 [rank:4] [train], epoch: 35/50, iter: 400/834, loss: 0.28040, lr: 0.298065, top1: 0.68469, throughput: 315.02 | 2022-04-11 06:04:45.187 [rank:1] [train], epoch: 35/50, iter: 400/834, loss: 0.28193, lr: 0.298065, top1: 0.68635, throughput: 315.41 | 2022-04-11 06:04:45.210 [rank:6] [train], epoch: 35/50, iter: 400/834, loss: 0.27977, lr: 0.298065, top1: 0.69031, throughput: 315.07 | 2022-04-11 06:04:45.234 [rank:5] [train], epoch: 35/50, iter: 400/834, loss: 0.28179, lr: 0.298065, top1: 0.68849, throughput: 315.23 | 2022-04-11 06:04:45.234 [rank:3] [train], epoch: 35/50, iter: 400/834, loss: 0.28145, lr: 0.298065, top1: 0.68573, throughput: 315.23 | 2022-04-11 06:04:45.243 [rank:0] [train], epoch: 35/50, iter: 400/834, loss: 0.28346, lr: 0.298065, top1: 0.68172, throughput: 314.87 | 2022-04-11 06:04:45.262 [rank:7] [train], epoch: 35/50, iter: 400/834, loss: 0.27928, lr: 0.298065, top1: 0.68995, throughput: 314.80 | 2022-04-11 06:04:45.272 [rank:4] [train], epoch: 35/50, iter: 500/834, loss: 0.27996, lr: 0.293502, top1: 0.68698, throughput: 312.74 | 2022-04-11 06:05:46.579 [rank:1] [train], epoch: 35/50, iter: 500/834, loss: 0.28236, lr: 0.293502, top1: 0.68333, throughput: 312.82 | 2022-04-11 06:05:46.587 [rank:2] [train], epoch: 35/50, iter: 500/834, loss: 0.28202, lr: 0.293502, top1: 0.68615, throughput: 312.41 | 2022-04-11 06:05:46.599 [rank:0] [train], epoch: 35/50, iter: 500/834, loss: 0.27952, lr: 0.293502, top1: 0.69281, throughput: 312.96 | 2022-04-11 06:05:46.612 [rank:6] [train], epoch: 35/50, iter: 500/834, loss: 0.28261, lr: 0.293502, top1: 0.68333, throughput: 312.72 | 2022-04-11 06:05:46.630 [rank:5] [train], epoch: 35/50, iter: 500/834, loss: 0.28257, lr: 0.293502, top1: 0.68573, throughput: 312.70 | 2022-04-11 06:05:46.636 [rank:7] [train], epoch: 35/50, iter: 500/834, loss: 0.28089, lr: 0.293502, top1: 0.69010, throughput: 312.82 | 2022-04-11 06:05:46.650 [rank:3] [train], epoch: 35/50, iter: 500/834, loss: 0.28035, lr: 0.293502, top1: 0.68901, throughput: 312.59 | 2022-04-11 06:05:46.667 [rank:4] [train], epoch: 35/50, iter: 600/834, loss: 0.27967, lr: 0.288966, top1: 0.68932, throughput: 312.76 | 2022-04-11 06:06:47.969 [rank:6] [train], epoch: 35/50, iter: 600/834, loss: 0.27979, lr: 0.288966, top1: 0.68745, throughput: 312.89 | 2022-04-11 06:06:47.993 [rank:0] [train], epoch: 35/50, iter: 600/834, loss: 0.27825, lr: 0.288966, top1: 0.69370, throughput: 312.69 | 2022-04-11 06:06:48.013 [rank:1] [train], epoch: 35/50, iter: 600/834, loss: 0.28132, lr: 0.288966, top1: 0.68760, throughput: 312.53 | 2022-04-11 06:06:48.020 [rank:5] [train], epoch: 35/50, iter: 600/834, loss: 0.27992, lr: 0.288966, top1: 0.68641, throughput: 312.73 | 2022-04-11 06:06:48.031 [rank:2] [train], epoch: 35/50, iter: 600/834, loss: 0.28147, lr: 0.288966, top1: 0.68359, throughput: 312.54 | 2022-04-11 06:06:48.031 [rank:3] [train], epoch: 35/50, iter: 600/834, loss: 0.28018, lr: 0.288966, top1: 0.68604, throughput: 312.82 | 2022-04-11 06:06:48.043 [rank:7] [train], epoch: 35/50, iter: 600/834, loss: 0.27856, lr: 0.288966, top1: 0.69260, throughput: 313.10 | 2022-04-11 06:06:47.971 [rank:2] [train], epoch: 35/50, iter: 700/834, loss: 0.28110, lr: 0.284457, top1: 0.68453, throughput: 313.76 | 2022-04-11 06:07:49.224 [rank:3] [train], epoch: 35/50, iter: 700/834, loss: 0.27947, lr: 0.284457, top1: 0.68833, throughput: 313.78 | 2022-04-11 06:07:49.232 [rank:7] [train], epoch: 35/50, iter: 700/834, loss: 0.28049, lr: 0.284457, top1: 0.68500, throughput: 313.40 | 2022-04-11 06:07:49.235 [rank:6] [train], epoch: 35/50, iter: 700/834, loss: 0.27852, lr: 0.284457, top1: 0.69036, throughput: 313.42 | 2022-04-11 06:07:49.253[rank:1] [train], epoch: 35/50, iter: 700/834, loss: 0.27880, lr: 0.284457, top1: 0.69057, throughput: 313.56 | 2022-04-11 06:07:49.252 [rank:5] [train], epoch: 35/50, iter: 700/834, loss: 0.27877, lr: 0.284457, top1: 0.68969, throughput: 313.61 | 2022-04-11 06:07:49.253 [rank:4] [train], epoch: 35/50, iter: 700/834, loss: 0.28281, lr: 0.284457, top1: 0.68188, throughput: 313.20 | 2022-04-11 06:07:49.272 [rank:0] [train], epoch: 35/50, iter: 700/834, loss: 0.27963, lr: 0.284457, top1: 0.69359, throughput: 313.37 | 2022-04-11 06:07:49.283 [rank:5] [train], epoch: 35/50, iter: 800/834, loss: 0.27786, lr: 0.279976, top1: 0.69135, throughput: 311.34 | 2022-04-11 06:08:50.922 [rank:3] [train], epoch: 35/50, iter: 800/834, loss: 0.28134, lr: 0.279976, top1: 0.68865, throughput: 311.17 | 2022-04-11 06:08:50.935 [rank:0] [train], epoch: 35/50, iter: 800/834, loss: 0.27945, lr: 0.279976, top1: 0.69177, throughput: 311.34 | 2022-04-11 06:08:50.951 [rank:4] [train], epoch: 35/50, iter: 800/834, loss: 0.28072, lr: 0.279976, top1: 0.68807, throughput: 311.21 | 2022-04-11 06:08:50.966 [rank:6] [train], epoch: 35/50, iter: 800/834, loss: 0.28123, lr: 0.279976, top1: 0.68594, throughput: 311.11 | 2022-04-11 06:08:50.968 [rank:1] [train], epoch: 35/50, iter: 800/834, loss: 0.27814, lr: 0.279976, top1: 0.69339, throughput: 311.05 | 2022-04-11 06:08:50.979 [rank:7] [train], epoch: 35/50, iter: 800/834, loss: 0.28126, lr: 0.279976, top1: 0.68297, throughput: 310.92 | 2022-04-11 06:08:50.987 [rank:2] [train], epoch: 35/50, iter: 800/834, loss: 0.27953, lr: 0.279976, top1: 0.68891, throughput: 310.83 | 2022-04-11 06:08:50.994 [rank:4] [train], epoch: 35/50, iter: 834/834, loss: 0.28105, lr: 0.278458, top1: 0.68336, throughput: 309.99 | 2022-04-11 06:09:12.025 [rank:5] [train], epoch: 35/50, iter: 834/834, loss: 0.28229, lr: 0.278458, top1: 0.68627, throughput: 309.20 | 2022-04-11 06:09:12.035 [rank:1] [train], epoch: 35/50, iter: 834/834, loss: 0.27488, lr: 0.278458, top1: 0.69317, throughput: 310.01 | 2022-04-11 06:09:12.037 [rank:7] [train], epoch: 35/50, iter: 834/834, loss: 0.28359, lr: 0.278458, top1: 0.68382, throughput: 310.10 | 2022-04-11 06:09:12.038 [rank:0] [train], epoch: 35/50, iter: 834/834, loss: 0.28058, lr: 0.278458, top1: 0.68704, throughput: 309.48 | 2022-04-11 06:09:12.044 [rank:2] [train], epoch: 35/50, iter: 834/834, loss: 0.28002, lr: 0.278458, top1: 0.68398, throughput: 310.08 | 2022-04-11 06:09:12.047 [rank:3] [train], epoch: 35/50, iter: 834/834, loss: 0.27938, lr: 0.278458, top1: 0.68735, throughput: 308.98 | 2022-04-11 06:09:12.063 [rank:6] [train], epoch: 35/50, iter: 834/834, loss: 0.28428, lr: 0.278458, top1: 0.67953, throughput: 309.06 | 2022-04-11 06:09:12.090 [rank:0] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.68288, throughput: 490.18 | 2022-04-11 06:09:24.795 [rank:1] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.68880, throughput: 489.69 | 2022-04-11 06:09:24.800 [rank:2] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.67328, throughput: 489.76 | 2022-04-11 06:09:24.808 [rank:5] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.66832, throughput: 488.90 | 2022-04-11 06:09:24.819 [rank:7] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.68032, throughput: 488.92 | 2022-04-11 06:09:24.821 [rank:4] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.67088, throughput: 488.29 | 2022-04-11 06:09:24.825 [rank:6] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.67200, throughput: 490.25 | 2022-04-11 06:09:24.838 [rank:3] [eval], epoch: 35/50, iter: 125/125, loss: 0.00000, lr: 0.278458, top1: 0.67472, throughput: 488.96 | 2022-04-11 06:09:24.845 [rank:4] [train], epoch: 36/50, iter: 100/834, loss: 0.27150, lr: 0.274014, top1: 0.70802, throughput: 312.68 | 2022-04-11 06:10:26.228 [rank:6] [train], epoch: 36/50, iter: 100/834, loss: 0.27357, lr: 0.274014, top1: 0.70187, throughput: 312.65 | 2022-04-11 06:10:26.249 [rank:5] [train], epoch: 36/50, iter: 100/834, loss: 0.27441, lr: 0.274014, top1: 0.69984, throughput: 312.48 | 2022-04-11 06:10:26.262 [rank:2] [train], epoch: 36/50, iter: 100/834, loss: 0.27414, lr: 0.274014, top1: 0.70177, throughput: 312.37 | 2022-04-11 06:10:26.273 [rank:7] [train], epoch: 36/50, iter: 100/834, loss: 0.27261, lr: 0.274014, top1: 0.70266, throughput: 312.39 | 2022-04-11 06:10:26.283 [rank:1] [train], epoch: 36/50, iter: 100/834, loss: 0.27443, lr: 0.274014, top1: 0.69953, throughput: 312.27 | 2022-04-11 06:10:26.284 [rank:0] [train], epoch: 36/50, iter: 100/834, loss: 0.27175, lr: 0.274014, top1: 0.70620, throughput: 312.19 | 2022-04-11 06:10:26.296 [rank:3] [train], epoch: 36/50, iter: 100/834, loss: 0.27547, lr: 0.274014, top1: 0.69698, throughput: 312.81 | 2022-04-11 06:10:26.223 [rank:6] [train], epoch: 36/50, iter: 200/834, loss: 0.27551, lr: 0.269598, top1: 0.70073, throughput: 314.45 | 2022-04-11 06:11:27.308 [rank:4] [train], epoch: 36/50, iter: 200/834, loss: 0.27544, lr: 0.269598, top1: 0.69802, throughput: 314.30 | 2022-04-11 06:11:27.317 [rank:0] [train], epoch: 36/50, iter: 200/834, loss: 0.27593, lr: 0.269598, top1: 0.69417, throughput: 314.64 | 2022-04-11 06:11:27.318 [rank:3] [train], epoch: 36/50, iter: 200/834, loss: 0.27543, lr: 0.269598, top1: 0.69865, throughput: 314.04 | 2022-04-11 06:11:27.361 [rank:5] [train], epoch: 36/50, iter: 200/834, loss: 0.27663, lr: 0.269598, top1: 0.69781, throughput: 314.18 | 2022-04-11 06:11:27.374 [rank:2] [train], epoch: 36/50, iter: 200/834, loss: 0.27562, lr: 0.269598, top1: 0.69797, throughput: 314.23 | 2022-04-11 06:11:27.375 [rank:1] [train], epoch: 36/50, iter: 200/834, loss: 0.27398, lr: 0.269598, top1: 0.69880, throughput: 314.23 | 2022-04-11 06:11:27.385 [rank:7] [train], epoch: 36/50, iter: 200/834, loss: 0.27241, lr: 0.269598, top1: 0.70328, throughput: 314.12 | 2022-04-11 06:11:27.406 [rank:5] [train], epoch: 36/50, iter: 300/834, loss: 0.27492, lr: 0.265210, top1: 0.70083, throughput: 311.80 | 2022-04-11 06:12:28.953 [rank:0] [train], epoch: 36/50, iter: 300/834, loss: 0.27698, lr: 0.265210, top1: 0.69354, throughput: 311.49 | 2022-04-11 06:12:28.957 [rank:7] [train], epoch: 36/50, iter: 300/834, loss: 0.27703, lr: 0.265210, top1: 0.69651, throughput: 311.88 | 2022-04-11 06:12:28.968 [rank:4] [train], epoch: 36/50, iter: 300/834, loss: 0.27626, lr: 0.265210, top1: 0.69094, throughput: 311.42 | 2022-04-11 06:12:28.970 [rank:1] [train], epoch: 36/50, iter: 300/834, loss: 0.27520, lr: 0.265210, top1: 0.69984, throughput: 311.61 | 2022-04-11 06:12:29.001 [rank:3] [train], epoch: 36/50, iter: 300/834, loss: 0.27531, lr: 0.265210, top1: 0.69839, throughput: 311.46 | 2022-04-11 06:12:29.007 [rank:6] [train], epoch: 36/50, iter: 300/834, loss: 0.27851, lr: 0.265210, top1: 0.68688, throughput: 311.14 | 2022-04-11 06:12:29.016 [rank:2] [train], epoch: 36/50, iter: 300/834, loss: 0.27716, lr: 0.265210, top1: 0.69385, throughput: 311.48 | 2022-04-11 06:12:29.017 [rank:2] [train], epoch: 36/50, iter: 400/834, loss: 0.27639, lr: 0.260851, top1: 0.69422, throughput: 312.31 | 2022-04-11 06:13:30.494 [rank:3] [train], epoch: 36/50, iter: 400/834, loss: 0.27310, lr: 0.260851, top1: 0.70333, throughput: 312.20 | 2022-04-11 06:13:30.506 [rank:0] [train], epoch: 36/50, iter: 400/834, loss: 0.27573, lr: 0.260851, top1: 0.69563, throughput: 311.93 | 2022-04-11 06:13:30.510 [rank:7] [train], epoch: 36/50, iter: 400/834, loss: 0.27510, lr: 0.260851, top1: 0.69646, throughput: 311.91 | 2022-04-11 06:13:30.526 [rank:4] [train], epoch: 36/50, iter: 400/834, loss: 0.27679, lr: 0.260851, top1: 0.69432, throughput: 311.90 | 2022-04-11 06:13:30.528 [rank:6] [train], epoch: 36/50, iter: 400/834, loss: 0.27428, lr: 0.260851, top1: 0.69745, throughput: 312.07 | 2022-04-11 06:13:30.540 [rank:5] [train], epoch: 36/50, iter: 400/834, loss: 0.27508, lr: 0.260851, top1: 0.69854, throughput: 311.70 | 2022-04-11 06:13:30.551 [rank:1] [train], epoch: 36/50, iter: 400/834, loss: 0.27546, lr: 0.260851, top1: 0.69641, throughput: 311.86 | 2022-04-11 06:13:30.568 [rank:7] [train], epoch: 36/50, iter: 500/834, loss: 0.27960, lr: 0.256520, top1: 0.69021, throughput: 312.71 | 2022-04-11 06:14:31.925 [rank:3] [train], epoch: 36/50, iter: 500/834, loss: 0.27847, lr: 0.256520, top1: 0.69083, throughput: 312.60 | 2022-04-11 06:14:31.926 [rank:4] [train], epoch: 36/50, iter: 500/834, loss: 0.27563, lr: 0.256520, top1: 0.69589, throughput: 312.70 | 2022-04-11 06:14:31.930 [rank:2] [train], epoch: 36/50, iter: 500/834, loss: 0.27733, lr: 0.256520, top1: 0.69250, throughput: 312.51 | 2022-04-11 06:14:31.932 [rank:1] [train], epoch: 36/50, iter: 500/834, loss: 0.27428, lr: 0.256520, top1: 0.69984, throughput: 312.80 | 2022-04-11 06:14:31.949 [rank:5] [train], epoch: 36/50, iter: 500/834, loss: 0.27627, lr: 0.256520, top1: 0.69250, throughput: 312.64 | 2022-04-11 06:14:31.964 [rank:0] [train], epoch: 36/50, iter: 500/834, loss: 0.27578, lr: 0.256520, top1: 0.69651, throughput: 312.37 | 2022-04-11 06:14:31.976 [rank:6] [train], epoch: 36/50, iter: 500/834, loss: 0.27774, lr: 0.256520, top1: 0.69474, throughput: 312.49 | 2022-04-11 06:14:31.982 [rank:7] [train], epoch: 36/50, iter: 600/834, loss: 0.27584, lr: 0.252219, top1: 0.69656, throughput: 313.80 | 2022-04-11 06:15:33.111 [rank:3] [train], epoch: 36/50, iter: 600/834, loss: 0.27556, lr: 0.252219, top1: 0.69641, throughput: 313.67 | 2022-04-11 06:15:33.138 [rank:6] [train], epoch: 36/50, iter: 600/834, loss: 0.27810, lr: 0.252219, top1: 0.69109, throughput: 313.91 | 2022-04-11 06:15:33.147 [rank:0] [train], epoch: 36/50, iter: 600/834, loss: 0.27691, lr: 0.252219, top1: 0.69286, throughput: 314.20 | 2022-04-11 06:15:33.084 [rank:4] [train], epoch: 36/50, iter: 600/834, loss: 0.27607, lr: 0.252219, top1: 0.69766, throughput: 313.58 | 2022-04-11 06:15:33.158 [rank:5] [train], epoch: 36/50, iter: 600/834, loss: 0.27712, lr: 0.252219, top1: 0.69391, throughput: 313.67 | 2022-04-11 06:15:33.176 [rank:2] [train], epoch: 36/50, iter: 600/834, loss: 0.27807, lr: 0.252219, top1: 0.69146, throughput: 313.50 | 2022-04-11 06:15:33.177 [rank:1] [train], epoch: 36/50, iter: 600/834, loss: 0.27784, lr: 0.252219, top1: 0.69250, throughput: 313.97 | 2022-04-11 06:15:33.101 [rank:4] [train], epoch: 36/50, iter: 700/834, loss: 0.27929, lr: 0.247946, top1: 0.68547, throughput: 311.59 | 2022-04-11 06:16:34.777 [rank:5] [train], epoch: 36/50, iter: 700/834, loss: 0.27691, lr: 0.247946, top1: 0.69609, throughput: 311.65 | 2022-04-11 06:16:34.784 [rank:1] [train], epoch: 36/50, iter: 700/834, loss: 0.27545, lr: 0.247946, top1: 0.69526, throughput: 311.10 | 2022-04-11 06:16:34.817 [rank:2] [train], epoch: 36/50, iter: 700/834, loss: 0.27757, lr: 0.247946, top1: 0.69255, throughput: 311.84 | 2022-04-11 06:16:34.747 [rank:3] [train], epoch: 36/50, iter: 700/834, loss: 0.27540, lr: 0.247946, top1: 0.69865, throughput: 311.22 | 2022-04-11 06:16:34.831 [rank:7] [train], epoch: 36/50, iter: 700/834, loss: 0.27625, lr: 0.247946, top1: 0.69516, throughput: 311.05 | 2022-04-11 06:16:34.837 [rank:6] [train], epoch: 36/50, iter: 700/834, loss: 0.27745, lr: 0.247946, top1: 0.69474, throughput: 311.21 | 2022-04-11 06:16:34.841 [rank:0] [train], epoch: 36/50, iter: 700/834, loss: 0.27796, lr: 0.247946, top1: 0.69135, throughput: 310.82 | 2022-04-11 06:16:34.855 [rank:3] [train], epoch: 36/50, iter: 800/834, loss: 0.27669, lr: 0.243704, top1: 0.69427, throughput: 315.05 | 2022-04-11 06:17:35.773 [rank:1] [train], epoch: 36/50, iter: 800/834, loss: 0.27655, lr: 0.243704, top1: 0.69167, throughput: 314.97 | 2022-04-11 06:17:35.775 [rank:2] [train], epoch: 36/50, iter: 800/834, loss: 0.27888, lr: 0.243704, top1: 0.69255, throughput: 314.56 | 2022-04-11 06:17:35.784 [rank:4] [train], epoch: 36/50, iter: 800/834, loss: 0.27499, lr: 0.243704, top1: 0.69807, throughput: 314.61 | 2022-04-11 06:17:35.805 [rank:6] [train], epoch: 36/50, iter: 800/834, loss: 0.27523, lr: 0.243704, top1: 0.69609, throughput: 314.93 | 2022-04-11 06:17:35.806 [rank:7] [train], epoch: 36/50, iter: 800/834, loss: 0.27910, lr: 0.243704, top1: 0.68906, throughput: 314.80 | 2022-04-11 06:17:35.829 [rank:0] [train], epoch: 36/50, iter: 800/834, loss: 0.27878, lr: 0.243704, top1: 0.69141, throughput: 314.74 | 2022-04-11 06:17:35.858 [rank:5] [train], epoch: 36/50, iter: 800/834, loss: 0.27718, lr: 0.243704, top1: 0.69385, throughput: 314.33 | 2022-04-11 06:17:35.866 [rank:2] [train], epoch: 36/50, iter: 834/834, loss: 0.27344, lr: 0.242268, top1: 0.69792, throughput: 312.94 | 2022-04-11 06:17:56.644 [rank:6] [train], epoch: 36/50, iter: 834/834, loss: 0.27659, lr: 0.242268, top1: 0.69424, throughput: 313.21 | 2022-04-11 06:17:56.648 [rank:3] [train], epoch: 36/50, iter: 834/834, loss: 0.27375, lr: 0.242268, top1: 0.70113, throughput: 312.67 | 2022-04-11 06:17:56.651 [rank:7] [train], epoch: 36/50, iter: 834/834, loss: 0.27814, lr: 0.242268, top1: 0.69194, throughput: 313.39 | 2022-04-11 06:17:56.659 [rank:1] [train], epoch: 36/50, iter: 834/834, loss: 0.27500, lr: 0.242268, top1: 0.69838, throughput: 312.47 | 2022-04-11 06:17:56.666 [rank:5] [train], epoch: 36/50, iter: 834/834, loss: 0.27670, lr: 0.242268, top1: 0.69225, throughput: 313.68 | 2022-04-11 06:17:56.677 [rank:0] [train], epoch: 36/50, iter: 834/834, loss: 0.28001, lr: 0.242268, top1: 0.68352, throughput: 313.39 | 2022-04-11 06:17:56.688 [rank:4] [train], epoch: 36/50, iter: 834/834, loss: 0.27755, lr: 0.242268, top1: 0.68903, throughput: 312.52 | 2022-04-11 06:17:56.694 [rank:0] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.69824, throughput: 484.43 | 2022-04-11 06:18:09.590 [rank:1] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.69056, throughput: 483.51 | 2022-04-11 06:18:09.593 [rank:2] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.68176, throughput: 482.10 | 2022-04-11 06:18:09.608 [rank:5] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.68272, throughput: 483.30 | 2022-04-11 06:18:09.609 [rank:4] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.68944, throughput: 483.89 | 2022-04-11 06:18:09.610 [rank:7] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.69104, throughput: 482.51 | 2022-04-11 06:18:09.612 [rank:3] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.68160, throughput: 481.88 | 2022-04-11 06:18:09.621 [rank:6] [eval], epoch: 36/50, iter: 125/125, loss: 0.00000, lr: 0.242268, top1: 0.69232, throughput: 481.17 | 2022-04-11 06:18:09.638 [rank:6] [train], epoch: 37/50, iter: 100/834, loss: 0.27240, lr: 0.238065, top1: 0.69974, throughput: 314.84 | 2022-04-11 06:19:10.622 [rank:4] [train], epoch: 37/50, iter: 100/834, loss: 0.27187, lr: 0.238065, top1: 0.70641, throughput: 314.64 | 2022-04-11 06:19:10.633 [rank:1] [train], epoch: 37/50, iter: 100/834, loss: 0.27152, lr: 0.238065, top1: 0.70693, throughput: 314.52 | 2022-04-11 06:19:10.638 [rank:7] [train], epoch: 37/50, iter: 100/834, loss: 0.27337, lr: 0.238065, top1: 0.70089, throughput: 314.61 | 2022-04-11 06:19:10.640 [rank:0] [train], epoch: 37/50, iter: 100/834, loss: 0.27298, lr: 0.238065, top1: 0.70141, throughput: 314.46 | 2022-04-11 06:19:10.646 [rank:3] [train], epoch: 37/50, iter: 100/834, loss: 0.26935, lr: 0.238065, top1: 0.70724, throughput: 314.53 | 2022-04-11 06:19:10.664 [rank:5] [train], epoch: 37/50, iter: 100/834, loss: 0.26980, lr: 0.238065, top1: 0.71198, throughput: 314.42 | 2022-04-11 06:19:10.674 [rank:2] [train], epoch: 37/50, iter: 100/834, loss: 0.27235, lr: 0.238065, top1: 0.70828, throughput: 314.37 | 2022-04-11 06:19:10.682 [rank:4] [train], epoch: 37/50, iter: 200/834, loss: 0.27355, lr: 0.233892, top1: 0.70318, throughput: 312.86 | 2022-04-11 06:20:12.001 [rank:1] [train], epoch: 37/50, iter: 200/834, loss: 0.27097, lr: 0.233892, top1: 0.70609, throughput: 312.76 | 2022-04-11 06:20:12.026 [rank:0] [train], epoch: 37/50, iter: 200/834, loss: 0.27165, lr: 0.233892, top1: 0.70203, throughput: 312.65 | 2022-04-11 06:20:12.057 [rank:2] [train], epoch: 37/50, iter: 200/834, loss: 0.27057, lr: 0.233892, top1: 0.70609, throughput: 312.83 | 2022-04-11 06:20:12.058 [rank:7] [train], epoch: 37/50, iter: 200/834, loss: 0.27309, lr: 0.233892, top1: 0.70281, throughput: 312.58 | 2022-04-11 06:20:12.064 [rank:3] [train], epoch: 37/50, iter: 200/834, loss: 0.27221, lr: 0.233892, top1: 0.70646, throughput: 312.70 | 2022-04-11 06:20:12.065 [rank:6] [train], epoch: 37/50, iter: 200/834, loss: 0.27270, lr: 0.233892, top1: 0.70656, throughput: 312.44 | 2022-04-11 06:20:12.072 [rank:5] [train], epoch: 37/50, iter: 200/834, loss: 0.27194, lr: 0.233892, top1: 0.70266, throughput: 312.71 | 2022-04-11 06:20:12.073 [rank:6] [train], epoch: 37/50, iter: 300/834, loss: 0.27201, lr: 0.229750, top1: 0.70354, throughput: 312.67 | 2022-04-11 06:21:13.480 [rank:7] [train], epoch: 37/50, iter: 300/834, loss: 0.27051, lr: 0.229750, top1: 0.70854, throughput: 312.60 | 2022-04-11 06:21:13.484 [rank:5] [train], epoch: 37/50, iter: 300/834, loss: 0.27129, lr: 0.229750, top1: 0.70615, throughput: 312.48 | 2022-04-11 06:21:13.518 [rank:0] [train], epoch: 37/50, iter: 300/834, loss: 0.27303, lr: 0.229750, top1: 0.70042, throughput: 312.39 | 2022-04-11 06:21:13.519 [rank:4] [train], epoch: 37/50, iter: 300/834, loss: 0.27372, lr: 0.229750, top1: 0.70052, throughput: 312.10 | 2022-04-11 06:21:13.520 [rank:1] [train], epoch: 37/50, iter: 300/834, loss: 0.27082, lr: 0.229750, top1: 0.70740, throughput: 312.16 | 2022-04-11 06:21:13.533 [rank:2] [train], epoch: 37/50, iter: 300/834, loss: 0.27311, lr: 0.229750, top1: 0.70250, throughput: 312.32 | 2022-04-11 06:21:13.534 [rank:3] [train], epoch: 37/50, iter: 300/834, loss: 0.27421, lr: 0.229750, top1: 0.69953, throughput: 312.35 | 2022-04-11 06:21:13.534 [rank:6] [train], epoch: 37/50, iter: 400/834, loss: 0.27310, lr: 0.225638, top1: 0.70594, throughput: 312.56 | 2022-04-11 06:22:14.908 [rank:1] [train], epoch: 37/50, iter: 400/834, loss: 0.27131, lr: 0.225638, top1: 0.70443, throughput: 312.68 | 2022-04-11 06:22:14.937 [rank:4] [train], epoch: 37/50, iter: 400/834, loss: 0.26840, lr: 0.225638, top1: 0.71203, throughput: 312.35 | 2022-04-11 06:22:14.988 [rank:7] [train], epoch: 37/50, iter: 400/834, loss: 0.27334, lr: 0.225638, top1: 0.69849, throughput: 312.16 | 2022-04-11 06:22:14.990 [rank:0] [train], epoch: 37/50, iter: 400/834, loss: 0.27158, lr: 0.225638, top1: 0.70302, throughput: 312.30 | 2022-04-11 06:22:14.998 [rank:5] [train], epoch: 37/50, iter: 400/834, loss: 0.27107, lr: 0.225638, top1: 0.70536, throughput: 312.27 | 2022-04-11 06:22:15.003 [rank:3] [train], epoch: 37/50, iter: 400/834, loss: 0.27324, lr: 0.225638, top1: 0.69974, throughput: 312.34 | 2022-04-11 06:22:15.006 [rank:2] [train], epoch: 37/50, iter: 400/834, loss: 0.27142, lr: 0.225638, top1: 0.70557, throughput: 312.26 | 2022-04-11 06:22:15.020 [rank:5] [train], epoch: 37/50, iter: 500/834, loss: 0.27318, lr: 0.221557, top1: 0.70083, throughput: 312.62 | 2022-04-11 06:23:16.420 [rank:0] [train], epoch: 37/50, iter: 500/834, loss: 0.27198, lr: 0.221557, top1: 0.70078, throughput: 312.51 | 2022-04-11 06:23:16.437 [rank:3] [train], epoch: 37/50, iter: 500/834, loss: 0.27272, lr: 0.221557, top1: 0.70177, throughput: 312.51 | 2022-04-11 06:23:16.445 [rank:6] [train], epoch: 37/50, iter: 500/834, loss: 0.27365, lr: 0.221557, top1: 0.70276, throughput: 312.00 | 2022-04-11 06:23:16.448 [rank:2] [train], epoch: 37/50, iter: 500/834, loss: 0.27450, lr: 0.221557, top1: 0.70094, throughput: 312.55 | 2022-04-11 06:23:16.451 [rank:7] [train], epoch: 37/50, iter: 500/834, loss: 0.27155, lr: 0.221557, top1: 0.70156, throughput: 312.21 | 2022-04-11 06:23:16.487 [rank:4] [train], epoch: 37/50, iter: 500/834, loss: 0.27264, lr: 0.221557, top1: 0.70281, throughput: 312.12 | 2022-04-11 06:23:16.503 [rank:1] [train], epoch: 37/50, iter: 500/834, loss: 0.27368, lr: 0.221557, top1: 0.69849, throughput: 311.62 | 2022-04-11 06:23:16.550 [rank:5] [train], epoch: 37/50, iter: 600/834, loss: 0.27304, lr: 0.217507, top1: 0.70130, throughput: 311.22 | 2022-04-11 06:24:18.113 [rank:0] [train], epoch: 37/50, iter: 600/834, loss: 0.27114, lr: 0.217507, top1: 0.70333, throughput: 311.30 | 2022-04-11 06:24:18.115 [rank:1] [train], epoch: 37/50, iter: 600/834, loss: 0.27130, lr: 0.217507, top1: 0.70615, throughput: 311.86 | 2022-04-11 06:24:18.117 [rank:6] [train], epoch: 37/50, iter: 600/834, loss: 0.27258, lr: 0.217507, top1: 0.70641, throughput: 311.33 | 2022-04-11 06:24:18.118 [rank:7] [train], epoch: 37/50, iter: 600/834, loss: 0.27123, lr: 0.217507, top1: 0.70609, throughput: 311.44 | 2022-04-11 06:24:18.136 [rank:4] [train], epoch: 37/50, iter: 600/834, loss: 0.27132, lr: 0.217507, top1: 0.70943, throughput: 311.41 | 2022-04-11 06:24:18.158 [rank:2] [train], epoch: 37/50, iter: 600/834, loss: 0.27464, lr: 0.217507, top1: 0.69750, throughput: 311.08 | 2022-04-11 06:24:18.172 [rank:3] [train], epoch: 37/50, iter: 600/834, loss: 0.27427, lr: 0.217507, top1: 0.69948, throughput: 311.34 | 2022-04-11 06:24:18.113 [rank:5] [train], epoch: 37/50, iter: 700/834, loss: 0.27315, lr: 0.213488, top1: 0.69922, throughput: 312.95 | 2022-04-11 06:25:19.464 [rank:4] [train], epoch: 37/50, iter: 700/834, loss: 0.27439, lr: 0.213488, top1: 0.70000, throughput: 313.14 | 2022-04-11 06:25:19.472 [rank:6] [train], epoch: 37/50, iter: 700/834, loss: 0.27385, lr: 0.213488, top1: 0.70125, throughput: 312.79 | 2022-04-11 06:25:19.500 [rank:1] [train], epoch: 37/50, iter: 700/834, loss: 0.27108, lr: 0.213488, top1: 0.70708, throughput: 312.78 | 2022-04-11 06:25:19.502 [rank:7] [train], epoch: 37/50, iter: 700/834, loss: 0.27190, lr: 0.213488, top1: 0.70182, throughput: 312.83 | 2022-04-11 06:25:19.511 [rank:0] [train], epoch: 37/50, iter: 700/834, loss: 0.27298, lr: 0.213488, top1: 0.70198, throughput: 312.71 | 2022-04-11 06:25:19.514 [rank:2] [train], epoch: 37/50, iter: 700/834, loss: 0.27284, lr: 0.213488, top1: 0.69984, throughput: 312.91 | 2022-04-11 06:25:19.531 [rank:3] [train], epoch: 37/50, iter: 700/834, loss: 0.27341, lr: 0.213488, top1: 0.70234, throughput: 312.53 | 2022-04-11 06:25:19.547 [rank:4] [train], epoch: 37/50, iter: 800/834, loss: 0.27213, lr: 0.209501, top1: 0.70313, throughput: 312.95 | 2022-04-11 06:26:20.824 [rank:5] [train], epoch: 37/50, iter: 800/834, loss: 0.27554, lr: 0.209501, top1: 0.69724, throughput: 312.67 | 2022-04-11 06:26:20.872 [rank:6] [train], epoch: 37/50, iter: 800/834, loss: 0.27296, lr: 0.209501, top1: 0.70198, throughput: 312.83 | 2022-04-11 06:26:20.875 [rank:1] [train], epoch: 37/50, iter: 800/834, loss: 0.27375, lr: 0.209501, top1: 0.70047, throughput: 312.80 | 2022-04-11 06:26:20.882 [rank:2] [train], epoch: 37/50, iter: 800/834, loss: 0.27257, lr: 0.209501, top1: 0.70172, throughput: 312.87 | 2022-04-11 06:26:20.898 [rank:3] [train], epoch: 37/50, iter: 800/834, loss: 0.27180, lr: 0.209501, top1: 0.70443, throughput: 312.80 | 2022-04-11 06:26:20.929 [rank:0] [train], epoch: 37/50, iter: 800/834, loss: 0.27301, lr: 0.209501, top1: 0.70438, throughput: 312.58 | 2022-04-11 06:26:20.939 [rank:7] [train], epoch: 37/50, iter: 800/834, loss: 0.27288, lr: 0.209501, top1: 0.70193, throughput: 312.90 | 2022-04-11 06:26:20.874 [rank:7] [train], epoch: 37/50, iter: 834/834, loss: 0.27165, lr: 0.208152, top1: 0.70282, throughput: 310.65 | 2022-04-11 06:26:41.888 [rank:4] [train], epoch: 37/50, iter: 834/834, loss: 0.27574, lr: 0.208152, top1: 0.69608, throughput: 309.80 | 2022-04-11 06:26:41.895 [rank:5] [train], epoch: 37/50, iter: 834/834, loss: 0.27439, lr: 0.208152, top1: 0.70803, throughput: 310.49 | 2022-04-11 06:26:41.896 [rank:1] [train], epoch: 37/50, iter: 834/834, loss: 0.27664, lr: 0.208152, top1: 0.69638, throughput: 310.56 | 2022-04-11 06:26:41.902 [rank:0] [train], epoch: 37/50, iter: 834/834, loss: 0.26929, lr: 0.208152, top1: 0.70619, throughput: 311.33 | 2022-04-11 06:26:41.907 [rank:3] [train], epoch: 37/50, iter: 834/834, loss: 0.27008, lr: 0.208152, top1: 0.71186, throughput: 311.11 | 2022-04-11 06:26:41.912 [rank:6] [train], epoch: 37/50, iter: 834/834, loss: 0.27327, lr: 0.208152, top1: 0.70251, throughput: 310.31 | 2022-04-11 06:26:41.912 [rank:2] [train], epoch: 37/50, iter: 834/834, loss: 0.27077, lr: 0.208152, top1: 0.70971, throughput: 311.24 | 2022-04-11 06:26:41.872 [rank:0] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.71712, throughput: 480.81 | 2022-04-11 06:26:54.905 [rank:1] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70592, throughput: 480.49 | 2022-04-11 06:26:54.910 [rank:2] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.69776, throughput: 479.37 | 2022-04-11 06:26:54.910 [rank:7] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70560, throughput: 479.46 | 2022-04-11 06:26:54.923 [rank:5] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.69792, throughput: 479.75 | 2022-04-11 06:26:54.924 [rank:4] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70304, throughput: 479.35 | 2022-04-11 06:26:54.934 [rank:3] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70384, throughput: 479.75 | 2022-04-11 06:26:54.939 [rank:6] [eval], epoch: 37/50, iter: 125/125, loss: 0.00000, lr: 0.208152, top1: 0.70992, throughput: 479.38 | 2022-04-11 06:26:54.949 [rank:4] [train], epoch: 38/50, iter: 100/834, loss: 0.26693, lr: 0.204207, top1: 0.71547, throughput: 314.59 | 2022-04-11 06:27:55.966 [rank:5] [train], epoch: 38/50, iter: 100/834, loss: 0.26518, lr: 0.204207, top1: 0.72068, throughput: 314.51 | 2022-04-11 06:27:55.972 [rank:3] [train], epoch: 38/50, iter: 100/834, loss: 0.26700, lr: 0.204207, top1: 0.71792, throughput: 314.50 | 2022-04-11 06:27:55.989 [rank:7] [train], epoch: 38/50, iter: 100/834, loss: 0.26540, lr: 0.204207, top1: 0.71609, throughput: 314.37 | 2022-04-11 06:27:55.997 [rank:2] [train], epoch: 38/50, iter: 100/834, loss: 0.26927, lr: 0.204207, top1: 0.70979, throughput: 314.23 | 2022-04-11 06:27:56.011 [rank:1] [train], epoch: 38/50, iter: 100/834, loss: 0.26742, lr: 0.204207, top1: 0.71667, throughput: 314.16 | 2022-04-11 06:27:56.024 [rank:0] [train], epoch: 38/50, iter: 100/834, loss: 0.26759, lr: 0.204207, top1: 0.71615, throughput: 314.10 | 2022-04-11 06:27:56.032 [rank:6] [train], epoch: 38/50, iter: 100/834, loss: 0.26739, lr: 0.204207, top1: 0.71589, throughput: 314.20 | 2022-04-11 06:27:56.056 [rank:0] [train], epoch: 38/50, iter: 200/834, loss: 0.26771, lr: 0.200294, top1: 0.70875, throughput: 313.54 | 2022-04-11 06:28:57.269 [rank:5] [train], epoch: 38/50, iter: 200/834, loss: 0.26921, lr: 0.200294, top1: 0.70844, throughput: 313.09 | 2022-04-11 06:28:57.297 [rank:7] [train], epoch: 38/50, iter: 200/834, loss: 0.26708, lr: 0.200294, top1: 0.71208, throughput: 313.16 | 2022-04-11 06:28:57.308 [rank:1] [train], epoch: 38/50, iter: 200/834, loss: 0.26737, lr: 0.200294, top1: 0.71510, throughput: 313.30 | 2022-04-11 06:28:57.308 [rank:3] [train], epoch: 38/50, iter: 200/834, loss: 0.26785, lr: 0.200294, top1: 0.71120, throughput: 313.10 | 2022-04-11 06:28:57.310 [rank:6] [train], epoch: 38/50, iter: 200/834, loss: 0.26579, lr: 0.200294, top1: 0.71766, throughput: 313.44 | 2022-04-11 06:28:57.313 [rank:2] [train], epoch: 38/50, iter: 200/834, loss: 0.26813, lr: 0.200294, top1: 0.71099, throughput: 313.16 | 2022-04-11 06:28:57.322 [rank:4] [train], epoch: 38/50, iter: 200/834, loss: 0.26665, lr: 0.200294, top1: 0.71526, throughput: 312.89 | 2022-04-11 06:28:57.330 [rank:6] [train], epoch: 38/50, iter: 300/834, loss: 0.26892, lr: 0.196414, top1: 0.71453, throughput: 314.97 | 2022-04-11 06:29:58.270 [rank:2] [train], epoch: 38/50, iter: 300/834, loss: 0.26669, lr: 0.196414, top1: 0.71656, throughput: 314.77 | 2022-04-11 06:29:58.319 [rank:3] [train], epoch: 38/50, iter: 300/834, loss: 0.26945, lr: 0.196414, top1: 0.71135, throughput: 314.71 | 2022-04-11 06:29:58.319 [rank:4] [train], epoch: 38/50, iter: 300/834, loss: 0.26811, lr: 0.196414, top1: 0.71385, throughput: 314.77 | 2022-04-11 06:29:58.328 [rank:1] [train], epoch: 38/50, iter: 300/834, loss: 0.26864, lr: 0.196414, top1: 0.70937, throughput: 314.63 | 2022-04-11 06:29:58.332 [rank:0] [train], epoch: 38/50, iter: 300/834, loss: 0.26642, lr: 0.196414, top1: 0.71526, throughput: 314.39 | 2022-04-11 06:29:58.339 [rank:7] [train], epoch: 38/50, iter: 300/834, loss: 0.26861, lr: 0.196414, top1: 0.71010, throughput: 314.55 | 2022-04-11 06:29:58.347 [rank:5] [train], epoch: 38/50, iter: 300/834, loss: 0.26755, lr: 0.196414, top1: 0.71234, throughput: 314.27 | 2022-04-11 06:29:58.390 [rank:5] [train], epoch: 38/50, iter: 400/834, loss: 0.26768, lr: 0.192566, top1: 0.71562, throughput: 313.07 | 2022-04-11 06:30:59.719 [rank:2] [train], epoch: 38/50, iter: 400/834, loss: 0.26769, lr: 0.192566, top1: 0.71328, throughput: 312.59 | 2022-04-11 06:30:59.741 [rank:1] [train], epoch: 38/50, iter: 400/834, loss: 0.26535, lr: 0.192566, top1: 0.71677, throughput: 312.51 | 2022-04-11 06:30:59.770 [rank:4] [train], epoch: 38/50, iter: 400/834, loss: 0.26855, lr: 0.192566, top1: 0.71172, throughput: 312.49 | 2022-04-11 06:30:59.770 [rank:3] [train], epoch: 38/50, iter: 400/834, loss: 0.26995, lr: 0.192566, top1: 0.70646, throughput: 312.35 | 2022-04-11 06:30:59.790 [rank:6] [train], epoch: 38/50, iter: 400/834, loss: 0.26741, lr: 0.192566, top1: 0.71380, throughput: 312.09 | 2022-04-11 06:30:59.790 [rank:7] [train], epoch: 38/50, iter: 400/834, loss: 0.26490, lr: 0.192566, top1: 0.71807, throughput: 312.46 | 2022-04-11 06:30:59.795 [rank:0] [train], epoch: 38/50, iter: 400/834, loss: 0.26979, lr: 0.192566, top1: 0.70937, throughput: 312.39 | 2022-04-11 06:30:59.801 [rank:4] [train], epoch: 38/50, iter: 500/834, loss: 0.26671, lr: 0.188750, top1: 0.71667, throughput: 313.83 | 2022-04-11 06:32:00.951 [rank:6] [train], epoch: 38/50, iter: 500/834, loss: 0.26724, lr: 0.188750, top1: 0.70901, throughput: 313.92 | 2022-04-11 06:32:00.953 [rank:2] [train], epoch: 38/50, iter: 500/834, loss: 0.26960, lr: 0.188750, top1: 0.70891, throughput: 313.61 | 2022-04-11 06:32:00.965 [rank:7] [train], epoch: 38/50, iter: 500/834, loss: 0.26956, lr: 0.188750, top1: 0.71057, throughput: 313.68 | 2022-04-11 06:32:01.004 [rank:1] [train], epoch: 38/50, iter: 500/834, loss: 0.26403, lr: 0.188750, top1: 0.71865, throughput: 313.51 | 2022-04-11 06:32:01.013 [rank:0] [train], epoch: 38/50, iter: 500/834, loss: 0.26719, lr: 0.188750, top1: 0.71203, throughput: 313.61 | 2022-04-11 06:32:01.023 [rank:3] [train], epoch: 38/50, iter: 500/834, loss: 0.26699, lr: 0.188750, top1: 0.71573, throughput: 313.42 | 2022-04-11 06:32:01.049 [rank:5] [train], epoch: 38/50, iter: 500/834, loss: 0.26514, lr: 0.188750, top1: 0.71781, throughput: 313.01 | 2022-04-11 06:32:01.059 [rank:5] [train], epoch: 38/50, iter: 600/834, loss: 0.26737, lr: 0.184968, top1: 0.71745, throughput: 312.34 | 2022-04-11 06:33:02.531 [rank:2] [train], epoch: 38/50, iter: 600/834, loss: 0.26851, lr: 0.184968, top1: 0.71120, throughput: 311.85 | 2022-04-11 06:33:02.533 [rank:6] [train], epoch: 38/50, iter: 600/834, loss: 0.26790, lr: 0.184968, top1: 0.71198, throughput: 311.71 | 2022-04-11 06:33:02.549 [rank:3] [train], epoch: 38/50, iter: 600/834, loss: 0.26620, lr: 0.184968, top1: 0.71641, throughput: 312.19 | 2022-04-11 06:33:02.550 [rank:7] [train], epoch: 38/50, iter: 600/834, loss: 0.26678, lr: 0.184968, top1: 0.71641, throughput: 311.92 | 2022-04-11 06:33:02.558 [rank:4] [train], epoch: 38/50, iter: 600/834, loss: 0.26925, lr: 0.184968, top1: 0.70859, throughput: 311.64 | 2022-04-11 06:33:02.559 [rank:1] [train], epoch: 38/50, iter: 600/834, loss: 0.26655, lr: 0.184968, top1: 0.71432, throughput: 311.93 | 2022-04-11 06:33:02.566 [rank:0] [train], epoch: 38/50, iter: 600/834, loss: 0.26704, lr: 0.184968, top1: 0.71385, throughput: 311.94 | 2022-04-11 06:33:02.573 [rank:2] [train], epoch: 38/50, iter: 700/834, loss: 0.26851, lr: 0.181218, top1: 0.70870, throughput: 311.95 | 2022-04-11 06:34:04.082 [rank:5] [train], epoch: 38/50, iter: 700/834, loss: 0.27152, lr: 0.181218, top1: 0.70193, throughput: 311.85 | 2022-04-11 06:34:04.099 [rank:4] [train], epoch: 38/50, iter: 700/834, loss: 0.26892, lr: 0.181218, top1: 0.71000, throughput: 311.94 | 2022-04-11 06:34:04.109 [rank:7] [train], epoch: 38/50, iter: 700/834, loss: 0.26950, lr: 0.181218, top1: 0.70818, throughput: 311.88 | 2022-04-11 06:34:04.121 [rank:3] [train], epoch: 38/50, iter: 700/834, loss: 0.26857, lr: 0.181218, top1: 0.70766, throughput: 311.71 | 2022-04-11 06:34:04.145 [rank:6] [train], epoch: 38/50, iter: 700/834, loss: 0.26983, lr: 0.181218, top1: 0.71094, throughput: 311.70 | 2022-04-11 06:34:04.147 [rank:0] [train], epoch: 38/50, iter: 700/834, loss: 0.26807, lr: 0.181218, top1: 0.70984, throughput: 311.67 | 2022-04-11 06:34:04.176 [rank:1] [train], epoch: 38/50, iter: 700/834, loss: 0.26574, lr: 0.181218, top1: 0.71385, throughput: 311.52 | 2022-04-11 06:34:04.199 [rank:0] [train], epoch: 38/50, iter: 800/834, loss: 0.26544, lr: 0.177502, top1: 0.71745, throughput: 314.19 | 2022-04-11 06:35:05.286 [rank:1] [train], epoch: 38/50, iter: 800/834, loss: 0.26840, lr: 0.177502, top1: 0.71234, throughput: 314.24 | 2022-04-11 06:35:05.299 [rank:5] [train], epoch: 38/50, iter: 800/834, loss: 0.26717, lr: 0.177502, top1: 0.71495, throughput: 313.66 | 2022-04-11 06:35:05.312 [rank:3] [train], epoch: 38/50, iter: 800/834, loss: 0.26953, lr: 0.177502, top1: 0.71172, throughput: 313.82 | 2022-04-11 06:35:05.326 [rank:6] [train], epoch: 38/50, iter: 800/834, loss: 0.26811, lr: 0.177502, top1: 0.71208, throughput: 313.80 | 2022-04-11 06:35:05.332 [rank:4] [train], epoch: 38/50, iter: 800/834, loss: 0.26872, lr: 0.177502, top1: 0.70839, throughput: 313.55 | 2022-04-11 06:35:05.342 [rank:2] [train], epoch: 38/50, iter: 800/834, loss: 0.26981, lr: 0.177502, top1: 0.70896, throughput: 313.41 | 2022-04-11 06:35:05.343 [rank:7] [train], epoch: 38/50, iter: 800/834, loss: 0.26532, lr: 0.177502, top1: 0.71453, throughput: 313.56 | 2022-04-11 06:35:05.354 [rank:6] [train], epoch: 38/50, iter: 834/834, loss: 0.26702, lr: 0.176246, top1: 0.71339, throughput: 316.24 | 2022-04-11 06:35:25.975 [rank:5] [train], epoch: 38/50, iter: 834/834, loss: 0.26424, lr: 0.176246, top1: 0.71385, throughput: 315.83 | 2022-04-11 06:35:25.981 [rank:0] [train], epoch: 38/50, iter: 834/834, loss: 0.26574, lr: 0.176246, top1: 0.71354, throughput: 315.37 | 2022-04-11 06:35:25.985 [rank:7] [train], epoch: 38/50, iter: 834/834, loss: 0.26544, lr: 0.176246, top1: 0.71615, throughput: 316.33 | 2022-04-11 06:35:25.991 [rank:3] [train], epoch: 38/50, iter: 834/834, loss: 0.26466, lr: 0.176246, top1: 0.72151, throughput: 315.87 | 2022-04-11 06:35:25.993 [rank:4] [train], epoch: 38/50, iter: 834/834, loss: 0.26501, lr: 0.176246, top1: 0.71752, throughput: 316.05 | 2022-04-11 06:35:25.997 [rank:1] [train], epoch: 38/50, iter: 834/834, loss: 0.26565, lr: 0.176246, top1: 0.71722, throughput: 315.31 | 2022-04-11 06:35:26.003 [rank:2] [train], epoch: 38/50, iter: 834/834, loss: 0.26900, lr: 0.176246, top1: 0.70956, throughput: 315.94 | 2022-04-11 06:35:26.005 [rank:0] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.72224, throughput: 481.72 | 2022-04-11 06:35:38.960 [rank:1] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.71344, throughput: 482.34 | 2022-04-11 06:35:38.960 [rank:2] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.70208, throughput: 482.06 | 2022-04-11 06:35:38.970 [rank:4] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.71440, throughput: 481.39 | 2022-04-11 06:35:38.981 [rank:7] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.71344, throughput: 481.10 | 2022-04-11 06:35:38.982 [rank:5] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.71008, throughput: 480.73 | 2022-04-11 06:35:38.982 [rank:3] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.70816, throughput: 480.45 | 2022-04-11 06:35:39.001 [rank:6] [eval], epoch: 38/50, iter: 125/125, loss: 0.00000, lr: 0.176246, top1: 0.71632, throughput: 479.63 | 2022-04-11 06:35:39.006 [rank:4] [train], epoch: 39/50, iter: 100/834, loss: 0.26467, lr: 0.172575, top1: 0.71802, throughput: 313.15 | 2022-04-11 06:36:40.293 [rank:5] [train], epoch: 39/50, iter: 100/834, loss: 0.26394, lr: 0.172575, top1: 0.72406, throughput: 313.03 | 2022-04-11 06:36:40.319 [rank:0] [train], epoch: 39/50, iter: 100/834, loss: 0.26357, lr: 0.172575, top1: 0.72255, throughput: 312.70 | 2022-04-11 06:36:40.360 [rank:2] [train], epoch: 39/50, iter: 100/834, loss: 0.25929, lr: 0.172575, top1: 0.73130, throughput: 312.68 | 2022-04-11 06:36:40.374 [rank:3] [train], epoch: 39/50, iter: 100/834, loss: 0.26177, lr: 0.172575, top1: 0.72786, throughput: 312.70 | 2022-04-11 06:36:40.403 [rank:7] [train], epoch: 39/50, iter: 100/834, loss: 0.26049, lr: 0.172575, top1: 0.73104, throughput: 312.56 | 2022-04-11 06:36:40.410 [rank:6] [train], epoch: 39/50, iter: 100/834, loss: 0.26288, lr: 0.172575, top1: 0.72313, throughput: 312.66 | 2022-04-11 06:36:40.414 [rank:1] [train], epoch: 39/50, iter: 100/834, loss: 0.26378, lr: 0.172575, top1: 0.72260, throughput: 312.42 | 2022-04-11 06:36:40.416 [rank:2] [train], epoch: 39/50, iter: 200/834, loss: 0.26278, lr: 0.168937, top1: 0.72214, throughput: 313.97 | 2022-04-11 06:37:41.527 [rank:4] [train], epoch: 39/50, iter: 200/834, loss: 0.26256, lr: 0.168937, top1: 0.72099, throughput: 313.49 | 2022-04-11 06:37:41.540 [rank:6] [train], epoch: 39/50, iter: 200/834, loss: 0.26336, lr: 0.168937, top1: 0.72193, throughput: 313.93 | 2022-04-11 06:37:41.574 [rank:7] [train], epoch: 39/50, iter: 200/834, loss: 0.26406, lr: 0.168937, top1: 0.72182, throughput: 313.90 | 2022-04-11 06:37:41.575 [rank:5] [train], epoch: 39/50, iter: 200/834, loss: 0.26133, lr: 0.168937, top1: 0.72370, throughput: 313.43 | 2022-04-11 06:37:41.577 [rank:0] [train], epoch: 39/50, iter: 200/834, loss: 0.26291, lr: 0.168937, top1: 0.72193, throughput: 313.54 | 2022-04-11 06:37:41.597 [rank:1] [train], epoch: 39/50, iter: 200/834, loss: 0.26328, lr: 0.168937, top1: 0.72130, throughput: 313.79 | 2022-04-11 06:37:41.604 [rank:3] [train], epoch: 39/50, iter: 200/834, loss: 0.26436, lr: 0.168937, top1: 0.72089, throughput: 313.89 | 2022-04-11 06:37:41.571 [rank:2] [train], epoch: 39/50, iter: 300/834, loss: 0.26443, lr: 0.165334, top1: 0.71818, throughput: 313.35 | 2022-04-11 06:38:42.801 [rank:0] [train], epoch: 39/50, iter: 300/834, loss: 0.26543, lr: 0.165334, top1: 0.71745, throughput: 313.63 | 2022-04-11 06:38:42.815 [rank:1] [train], epoch: 39/50, iter: 300/834, loss: 0.26584, lr: 0.165334, top1: 0.71766, throughput: 313.67 | 2022-04-11 06:38:42.815 [rank:6] [train], epoch: 39/50, iter: 300/834, loss: 0.26192, lr: 0.165334, top1: 0.72786, throughput: 313.47 | 2022-04-11 06:38:42.824 [rank:3] [train], epoch: 39/50, iter: 300/834, loss: 0.26504, lr: 0.165334, top1: 0.71828, throughput: 313.39 | 2022-04-11 06:38:42.837 [rank:5] [train], epoch: 39/50, iter: 300/834, loss: 0.26300, lr: 0.165334, top1: 0.72375, throughput: 313.39 | 2022-04-11 06:38:42.842 [rank:7] [train], epoch: 39/50, iter: 300/834, loss: 0.26304, lr: 0.165334, top1: 0.72156, throughput: 313.17 | 2022-04-11 06:38:42.884 [rank:4] [train], epoch: 39/50, iter: 300/834, loss: 0.26395, lr: 0.165334, top1: 0.72172, throughput: 313.48 | 2022-04-11 06:38:42.787 [rank:5] [train], epoch: 39/50, iter: 400/834, loss: 0.26335, lr: 0.161764, top1: 0.72078, throughput: 312.99 | 2022-04-11 06:39:44.187 [rank:2] [train], epoch: 39/50, iter: 400/834, loss: 0.26264, lr: 0.161764, top1: 0.72292, throughput: 312.64 | 2022-04-11 06:39:44.213 [rank:0] [train], epoch: 39/50, iter: 400/834, loss: 0.26310, lr: 0.161764, top1: 0.71880, throughput: 312.61 | 2022-04-11 06:39:44.233 [rank:6] [train], epoch: 39/50, iter: 400/834, loss: 0.26504, lr: 0.161764, top1: 0.71922, throughput: 312.61 | 2022-04-11 06:39:44.243 [rank:7] [train], epoch: 39/50, iter: 400/834, loss: 0.26087, lr: 0.161764, top1: 0.72865, throughput: 312.83 | 2022-04-11 06:39:44.259 [rank:4] [train], epoch: 39/50, iter: 400/834, loss: 0.26339, lr: 0.161764, top1: 0.72062, throughput: 312.77 | 2022-04-11 06:39:44.173 [rank:3] [train], epoch: 39/50, iter: 400/834, loss: 0.26596, lr: 0.161764, top1: 0.71750, throughput: 312.51 | 2022-04-11 06:39:44.275 [rank:1] [train], epoch: 39/50, iter: 400/834, loss: 0.26405, lr: 0.161764, top1: 0.71609, throughput: 312.37 | 2022-04-11 06:39:44.281 [rank:4] [train], epoch: 39/50, iter: 500/834, loss: 0.26316, lr: 0.158229, top1: 0.72125, throughput: 312.12 | 2022-04-11 06:40:45.688 [rank:2] [train], epoch: 39/50, iter: 500/834, loss: 0.26343, lr: 0.158229, top1: 0.71896, throughput: 312.19 | 2022-04-11 06:40:45.713 [rank:6] [train], epoch: 39/50, iter: 500/834, loss: 0.26297, lr: 0.158229, top1: 0.71885, throughput: 312.28 | 2022-04-11 06:40:45.727 [rank:1] [train], epoch: 39/50, iter: 500/834, loss: 0.26373, lr: 0.158229, top1: 0.71990, throughput: 312.42 | 2022-04-11 06:40:45.737 [rank:3] [train], epoch: 39/50, iter: 500/834, loss: 0.26280, lr: 0.158229, top1: 0.72240, throughput: 312.29 | 2022-04-11 06:40:45.757 [rank:0] [train], epoch: 39/50, iter: 500/834, loss: 0.26083, lr: 0.158229, top1: 0.72234, throughput: 312.06 | 2022-04-11 06:40:45.760 [rank:5] [train], epoch: 39/50, iter: 500/834, loss: 0.26116, lr: 0.158229, top1: 0.72688, throughput: 311.69 | 2022-04-11 06:40:45.786 [rank:7] [train], epoch: 39/50, iter: 500/834, loss: 0.26681, lr: 0.158229, top1: 0.71057, throughput: 312.46 | 2022-04-11 06:40:45.706 [rank:0] [train], epoch: 39/50, iter: 600/834, loss: 0.26685, lr: 0.154729, top1: 0.71849, throughput: 310.99 | 2022-04-11 06:41:47.498 [rank:1] [train], epoch: 39/50, iter: 600/834, loss: 0.26343, lr: 0.154729, top1: 0.72297, throughput: 310.80 | 2022-04-11 06:41:47.512 [rank:3] [train], epoch: 39/50, iter: 600/834, loss: 0.26526, lr: 0.154729, top1: 0.72141, throughput: 310.89 | 2022-04-11 06:41:47.514 [rank:7] [train], epoch: 39/50, iter: 600/834, loss: 0.26760, lr: 0.154729, top1: 0.71318, throughput: 310.61 | 2022-04-11 06:41:47.521 [rank:5] [train], epoch: 39/50, iter: 600/834, loss: 0.26574, lr: 0.154729, top1: 0.71536, throughput: 311.00 | 2022-04-11 06:41:47.523 [rank:4] [train], epoch: 39/50, iter: 600/834, loss: 0.26211, lr: 0.154729, top1: 0.72240, throughput: 310.49 | 2022-04-11 06:41:47.526 [rank:6] [train], epoch: 39/50, iter: 600/834, loss: 0.26573, lr: 0.154729, top1: 0.71802, throughput: 310.59 | 2022-04-11 06:41:47.544 [rank:2] [train], epoch: 39/50, iter: 600/834, loss: 0.26282, lr: 0.154729, top1: 0.71818, throughput: 310.51 | 2022-04-11 06:41:47.547 [rank:5] [train], epoch: 39/50, iter: 700/834, loss: 0.26336, lr: 0.151264, top1: 0.72130, throughput: 313.04 | 2022-04-11 06:42:48.858 [rank:4] [train], epoch: 39/50, iter: 700/834, loss: 0.26293, lr: 0.151264, top1: 0.72146, throughput: 313.00 | 2022-04-11 06:42:48.867 [rank:1] [train], epoch: 39/50, iter: 700/834, loss: 0.26321, lr: 0.151264, top1: 0.72161, throughput: 312.92 | 2022-04-11 06:42:48.870 [rank:0] [train], epoch: 39/50, iter: 700/834, loss: 0.26462, lr: 0.151264, top1: 0.71646, throughput: 312.62 | 2022-04-11 06:42:48.915 [rank:3] [train], epoch: 39/50, iter: 700/834, loss: 0.26250, lr: 0.151264, top1: 0.72229, throughput: 312.69 | 2022-04-11 06:42:48.917 [rank:7] [train], epoch: 39/50, iter: 700/834, loss: 0.26332, lr: 0.151264, top1: 0.72026, throughput: 312.71 | 2022-04-11 06:42:48.919 [rank:6] [train], epoch: 39/50, iter: 700/834, loss: 0.26161, lr: 0.151264, top1: 0.72516, throughput: 312.81 | 2022-04-11 06:42:48.923 [rank:2] [train], epoch: 39/50, iter: 700/834, loss: 0.26187, lr: 0.151264, top1: 0.72198, throughput: 312.76 | 2022-04-11 06:42:48.935 [rank:4] [train], epoch: 39/50, iter: 800/834, loss: 0.26181, lr: 0.147833, top1: 0.72417, throughput: 312.88 | 2022-04-11 06:43:50.233 [rank:3] [train], epoch: 39/50, iter: 800/834, loss: 0.26102, lr: 0.147833, top1: 0.72646, throughput: 313.08 | 2022-04-11 06:43:50.243 [rank:0] [train], epoch: 39/50, iter: 800/834, loss: 0.26332, lr: 0.147833, top1: 0.72359, throughput: 313.04 | 2022-04-11 06:43:50.248 [rank:2] [train], epoch: 39/50, iter: 800/834, loss: 0.26213, lr: 0.147833, top1: 0.72516, throughput: 313.08 | 2022-04-11 06:43:50.262 [rank:7] [train], epoch: 39/50, iter: 800/834, loss: 0.26267, lr: 0.147833, top1: 0.72042, throughput: 312.98 | 2022-04-11 06:43:50.265 [rank:6] [train], epoch: 39/50, iter: 800/834, loss: 0.26139, lr: 0.147833, top1: 0.72464, throughput: 312.94 | 2022-04-11 06:43:50.278 [rank:1] [train], epoch: 39/50, iter: 800/834, loss: 0.26479, lr: 0.147833, top1: 0.71974, throughput: 312.62 | 2022-04-11 06:43:50.287 [rank:5] [train], epoch: 39/50, iter: 800/834, loss: 0.26298, lr: 0.147833, top1: 0.72135, throughput: 312.41 | 2022-04-11 06:43:50.316 [rank:0] [train], epoch: 39/50, iter: 834/834, loss: 0.26459, lr: 0.146675, top1: 0.72258, throughput: 312.87 | 2022-04-11 06:44:11.113 [rank:4] [train], epoch: 39/50, iter: 834/834, loss: 0.26050, lr: 0.146675, top1: 0.72472, throughput: 312.56 | 2022-04-11 06:44:11.119 [rank:2] [train], epoch: 39/50, iter: 834/834, loss: 0.26393, lr: 0.146675, top1: 0.72120, throughput: 312.87 | 2022-04-11 06:44:11.127 [rank:1] [train], epoch: 39/50, iter: 834/834, loss: 0.26380, lr: 0.146675, top1: 0.71768, throughput: 313.10 | 2022-04-11 06:44:11.136 [rank:5] [train], epoch: 39/50, iter: 834/834, loss: 0.26780, lr: 0.146675, top1: 0.70971, throughput: 313.52 | 2022-04-11 06:44:11.138 [rank:6] [train], epoch: 39/50, iter: 834/834, loss: 0.26442, lr: 0.146675, top1: 0.71783, throughput: 312.77 | 2022-04-11 06:44:11.149 [rank:3] [train], epoch: 39/50, iter: 834/834, loss: 0.26088, lr: 0.146675, top1: 0.72549, throughput: 311.95 | 2022-04-11 06:44:11.170 [rank:7] [train], epoch: 39/50, iter: 834/834, loss: 0.25882, lr: 0.146675, top1: 0.72442, throughput: 312.24 | 2022-04-11 06:44:11.172 [rank:0] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.73408, throughput: 480.80 | 2022-04-11 06:44:24.112 [rank:2] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.71792, throughput: 481.06 | 2022-04-11 06:44:24.120 [rank:1] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.73216, throughput: 481.34 | 2022-04-11 06:44:24.121 [rank:3] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.72720, throughput: 482.35 | 2022-04-11 06:44:24.127 [rank:4] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.72704, throughput: 480.44 | 2022-04-11 06:44:24.128 [rank:5] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.72048, throughput: 480.96 | 2022-04-11 06:44:24.132 [rank:7] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.73472, throughput: 481.78 | 2022-04-11 06:44:24.145 [rank:6] [eval], epoch: 39/50, iter: 125/125, loss: 0.00000, lr: 0.146675, top1: 0.72720, throughput: 480.44 | 2022-04-11 06:44:24.158 [rank:4] [train], epoch: 40/50, iter: 100/834, loss: 0.25857, lr: 0.143292, top1: 0.73005, throughput: 313.07 | 2022-04-11 06:45:25.456 [rank:1] [train], epoch: 40/50, iter: 100/834, loss: 0.25855, lr: 0.143292, top1: 0.73464, throughput: 313.00 | 2022-04-11 06:45:25.462 [rank:6] [train], epoch: 40/50, iter: 100/834, loss: 0.25653, lr: 0.143292, top1: 0.73714, throughput: 313.11 | 2022-04-11 06:45:25.478 [rank:5] [train], epoch: 40/50, iter: 100/834, loss: 0.25859, lr: 0.143292, top1: 0.73099, throughput: 313.23 | 2022-04-11 06:45:25.430 [rank:0] [train], epoch: 40/50, iter: 100/834, loss: 0.25685, lr: 0.143292, top1: 0.73458, throughput: 312.82 | 2022-04-11 06:45:25.488 [rank:7] [train], epoch: 40/50, iter: 100/834, loss: 0.25674, lr: 0.143292, top1: 0.73432, throughput: 313.28 | 2022-04-11 06:45:25.431 [rank:2] [train], epoch: 40/50, iter: 100/834, loss: 0.25795, lr: 0.143292, top1: 0.73448, throughput: 313.22 | 2022-04-11 06:45:25.417 [rank:3] [train], epoch: 40/50, iter: 100/834, loss: 0.25712, lr: 0.143292, top1: 0.73464, throughput: 313.18 | 2022-04-11 06:45:25.434 [rank:5] [train], epoch: 40/50, iter: 200/834, loss: 0.26087, lr: 0.139944, top1: 0.72792, throughput: 312.33 | 2022-04-11 06:46:26.902 [rank:7] [train], epoch: 40/50, iter: 200/834, loss: 0.25812, lr: 0.139944, top1: 0.72828, throughput: 312.11 | 2022-04-11 06:46:26.947 [rank:1] [train], epoch: 40/50, iter: 200/834, loss: 0.25756, lr: 0.139944, top1: 0.73396, throughput: 312.22 | 2022-04-11 06:46:26.957 [rank:4] [train], epoch: 40/50, iter: 200/834, loss: 0.26029, lr: 0.139944, top1: 0.72901, throughput: 312.13 | 2022-04-11 06:46:26.968 [rank:2] [train], epoch: 40/50, iter: 200/834, loss: 0.26205, lr: 0.139944, top1: 0.72141, throughput: 311.89 [rank:0] [train], epoch: 40/50, iter: 200/834, loss: 0.25915, lr: 0.139944, top1: 0.72760, throughput: 312.25| 2022-04-11 06:46:26.977 | 2022-04-11 06:46:26.977 [rank:6] [train], epoch: 40/50, iter: 200/834, loss: 0.25907, lr: 0.139944, top1: 0.73583, throughput: 312.16 | 2022-04-11 06:46:26.986 [rank:3] [train], epoch: 40/50, iter: 200/834, loss: 0.25812, lr: 0.139944, top1: 0.73641, throughput: 311.69 | 2022-04-11 06:46:27.034 [rank:1] [train], epoch: 40/50, iter: 300/834, loss: 0.25966, lr: 0.136632, top1: 0.72901, throughput: 314.52 | 2022-04-11 06:47:28.003 [rank:5] [train], epoch: 40/50, iter: 300/834, loss: 0.25993, lr: 0.136632, top1: 0.73406, throughput: 314.17 | 2022-04-11 06:47:28.016 [rank:2] [train], epoch: 40/50, iter: 300/834, loss: 0.25828, lr: 0.136632, top1: 0.73021, throughput: 314.49 | 2022-04-11 06:47:28.028 [rank:0] [train], epoch: 40/50, iter: 300/834, loss: 0.25972, lr: 0.136632, top1: 0.72828, throughput: 314.49 | 2022-04-11 06:47:28.028 [rank:4] [train], epoch: 40/50, iter: 300/834, loss: 0.26131, lr: 0.136632, top1: 0.72625, throughput: 314.44 | 2022-04-11 06:47:28.030 [rank:3] [train], epoch: 40/50, iter: 300/834, loss: 0.25829, lr: 0.136632, top1: 0.73229, throughput: 314.75 | 2022-04-11 06:47:28.035 [rank:6] [train], epoch: 40/50, iter: 300/834, loss: 0.25944, lr: 0.136632, top1: 0.72974, throughput: 314.45 | 2022-04-11 06:47:28.045 [rank:7] [train], epoch: 40/50, iter: 300/834, loss: 0.26064, lr: 0.136632, top1: 0.73104, throughput: 314.17 | 2022-04-11 06:47:28.060 [rank:5] [train], epoch: 40/50, iter: 400/834, loss: 0.25800, lr: 0.133356, top1: 0.73104, throughput: 312.93 | 2022-04-11 06:48:29.371 [rank:3] [train], epoch: 40/50, iter: 400/834, loss: 0.25635, lr: 0.133356, top1: 0.73635, throughput: 312.92 | 2022-04-11 06:48:29.392 [rank:6] [train], epoch: 40/50, iter: 400/834, loss: 0.25890, lr: 0.133356, top1: 0.73167, throughput: 312.95 | 2022-04-11 06:48:29.398 [rank:0] [train], epoch: 40/50, iter: 400/834, loss: 0.25797, lr: 0.133356, top1: 0.73490, throughput: 312.86 | 2022-04-11 06:48:29.398 [rank:1] [train], epoch: 40/50, iter: 400/834, loss: 0.25890, lr: 0.133356, top1: 0.73031, throughput: 312.56 | 2022-04-11 06:48:29.431 [rank:7] [train], epoch: 40/50, iter: 400/834, loss: 0.25966, lr: 0.133356, top1: 0.73141, throughput: 312.81 | 2022-04-11 06:48:29.439 [rank:2] [train], epoch: 40/50, iter: 400/834, loss: 0.26085, lr: 0.133356, top1: 0.72609, throughput: 312.62 | 2022-04-11 06:48:29.443 [rank:4] [train], epoch: 40/50, iter: 400/834, loss: 0.25929, lr: 0.133356, top1: 0.73505, throughput: 312.57 | 2022-04-11 06:48:29.455 [rank:6] [train], epoch: 40/50, iter: 500/834, loss: 0.25863, lr: 0.130115, top1: 0.72948, throughput: 311.99 | 2022-04-11 06:49:30.938 [rank:4] [train], epoch: 40/50, iter: 500/834, loss: 0.26057, lr: 0.130115, top1: 0.72615, throughput: 312.15 | 2022-04-11 06:49:30.965 [rank:7] [train], epoch: 40/50, iter: 500/834, loss: 0.25857, lr: 0.130115, top1: 0.73323, throughput: 312.06 | 2022-04-11 06:49:30.967 [rank:5] [train], epoch: 40/50, iter: 500/834, loss: 0.25832, lr: 0.130115, top1: 0.72734, throughput: 311.66 | 2022-04-11 06:49:30.978 [rank:2] [train], epoch: 40/50, iter: 500/834, loss: 0.26071, lr: 0.130115, top1: 0.72521, throughput: 311.97 | 2022-04-11 06:49:30.989 [rank:0] [train], epoch: 40/50, iter: 500/834, loss: 0.25826, lr: 0.130115, top1: 0.73339, throughput: 311.69 | 2022-04-11 06:49:30.998 [rank:1] [train], epoch: 40/50, iter: 500/834, loss: 0.25931, lr: 0.130115, top1: 0.72969, throughput: 311.74 | 2022-04-11 06:49:31.022 [rank:3] [train], epoch: 40/50, iter: 500/834, loss: 0.25921, lr: 0.130115, top1: 0.73068, throughput: 311.41 | 2022-04-11 06:49:31.046 [rank:1] [train], epoch: 40/50, iter: 600/834, loss: 0.25896, lr: 0.126911, top1: 0.73266, throughput: 313.45 | 2022-04-11 06:50:32.275 [rank:5] [train], epoch: 40/50, iter: 600/834, loss: 0.25815, lr: 0.126911, top1: 0.73214, throughput: 313.10 | 2022-04-11 06:50:32.300 [rank:7] [train], epoch: 40/50, iter: 600/834, loss: 0.25916, lr: 0.126911, top1: 0.72995, throughput: 313.01 | 2022-04-11 06:50:32.306 [rank:2] [train], epoch: 40/50, iter: 600/834, loss: 0.26034, lr: 0.126911, top1: 0.73057, throughput: 313.12 | 2022-04-11 06:50:32.306 [rank:6] [train], epoch: 40/50, iter: 600/834, loss: 0.25944, lr: 0.126911, top1: 0.72849, throughput: 312.77 | 2022-04-11 06:50:32.326 [rank:3] [train], epoch: 40/50, iter: 600/834, loss: 0.25795, lr: 0.126911, top1: 0.73359, throughput: 313.15 | 2022-04-11 06:50:32.359 [rank:4] [train], epoch: 40/50, iter: 600/834, loss: 0.25967, lr: 0.126911, top1: 0.72729, throughput: 312.73 | 2022-04-11 06:50:32.359 [rank:0] [train], epoch: 40/50, iter: 600/834, loss: 0.26036, lr: 0.126911, top1: 0.72687, throughput: 313.24 | 2022-04-11 06:50:32.294 [rank:2] [train], epoch: 40/50, iter: 700/834, loss: 0.26024, lr: 0.123743, top1: 0.72901, throughput: 312.20 | 2022-04-11 06:51:33.806 [rank:0] [train], epoch: 40/50, iter: 700/834, loss: 0.25750, lr: 0.123743, top1: 0.72802, throughput: 312.09 | 2022-04-11 06:51:33.815 [rank:6] [train], epoch: 40/50, iter: 700/834, loss: 0.25739, lr: 0.123743, top1: 0.73359, throughput: 312.24 | 2022-04-11 06:51:33.818 [rank:3] [train], epoch: 40/50, iter: 700/834, loss: 0.25902, lr: 0.123743, top1: 0.73083, throughput: 312.31 | 2022-04-11 06:51:33.835 [rank:5] [train], epoch: 40/50, iter: 700/834, loss: 0.25784, lr: 0.123743, top1: 0.73130, throughput: 311.97 | 2022-04-11 06:51:33.843 [rank:7] [train], epoch: 40/50, iter: 700/834, loss: 0.26002, lr: 0.123743, top1: 0.72911, throughput: 311.90 | 2022-04-11 06:51:33.864 [rank:1] [train], epoch: 40/50, iter: 700/834, loss: 0.25987, lr: 0.123743, top1: 0.72932, throughput: 311.71 | 2022-04-11 06:51:33.871 [rank:4] [train], epoch: 40/50, iter: 700/834, loss: 0.26037, lr: 0.123743, top1: 0.72490, throughput: 312.12 | 2022-04-11 06:51:33.873 [rank:2] [train], epoch: 40/50, iter: 800/834, loss: 0.25873, lr: 0.120612, top1: 0.72818, throughput: 312.31 | 2022-04-11 06:52:35.284 [rank:5] [train], epoch: 40/50, iter: 800/834, loss: 0.25902, lr: 0.120612, top1: 0.72896, throughput: 312.34 | 2022-04-11 06:52:35.315 [rank:4] [train], epoch: 40/50, iter: 800/834, loss: 0.25949, lr: 0.120612, top1: 0.73036, throughput: 312.46 | 2022-04-11 06:52:35.321 [rank:3] [train], epoch: 40/50, iter: 800/834, loss: 0.25607, lr: 0.120612, top1: 0.73656, throughput: 312.24 | 2022-04-11 06:52:35.326 [rank:0] [train], epoch: 40/50, iter: 800/834, loss: 0.25791, lr: 0.120612, top1: 0.73380, throughput: 312.13 | 2022-04-11 06:52:35.328 [rank:1] [train], epoch: 40/50, iter: 800/834, loss: 0.25905, lr: 0.120612, top1: 0.73318, throughput: 312.21 | 2022-04-11 06:52:35.369 [rank:6] [train], epoch: 40/50, iter: 800/834, loss: 0.25873, lr: 0.120612, top1: 0.72917, throughput: 311.93 | 2022-04-11 06:52:35.370 [rank:7] [train], epoch: 40/50, iter: 800/834, loss: 0.25648, lr: 0.120612, top1: 0.73458, throughput: 312.53 | 2022-04-11 06:52:35.298 [rank:6] [train], epoch: 40/50, iter: 834/834, loss: 0.26058, lr: 0.119556, top1: 0.72595, throughput: 312.79 | 2022-04-11 06:52:56.241 [rank:5] [train], epoch: 40/50, iter: 834/834, loss: 0.26089, lr: 0.119556, top1: 0.72089, throughput: 311.90 | 2022-04-11 06:52:56.245 [rank:2] [train], epoch: 40/50, iter: 834/834, loss: 0.25899, lr: 0.119556, top1: 0.73361, throughput: 311.34 | 2022-04-11 06:52:56.251 [rank:3] [train], epoch: 40/50, iter: 834/834, loss: 0.25759, lr: 0.119556, top1: 0.73453, throughput: 311.97 | 2022-04-11 06:52:56.252 [rank:7] [train], epoch: 40/50, iter: 834/834, loss: 0.26129, lr: 0.119556, top1: 0.72335, throughput: 311.46 | 2022-04-11 06:52:56.257 [rank:1] [train], epoch: 40/50, iter: 834/834, loss: 0.25768, lr: 0.119556, top1: 0.73637, throughput: 312.43 | 2022-04-11 06:52:56.263 [rank:0] [train], epoch: 40/50, iter: 834/834, loss: 0.25733, lr: 0.119556, top1: 0.73192, throughput: 311.65 | 2022-04-11 06:52:56.275 [rank:4] [train], epoch: 40/50, iter: 834/834, loss: 0.26283, lr: 0.119556, top1: 0.72718, throughput: 311.06 | 2022-04-11 06:52:56.308 [rank:0] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73248, throughput: 489.78 | 2022-04-11 06:53:09.036 [rank:1] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73632, throughput: 488.99 | 2022-04-11 06:53:09.044 [rank:2] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.72608, throughput: 488.37 | 2022-04-11 06:53:09.049 [rank:4] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73328, throughput: 490.36 | 2022-04-11 06:53:09.054 [rank:3] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73168, throughput: 488.17 | 2022-04-11 06:53:09.055 [rank:7] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.74016, throughput: 487.95 | 2022-04-11 06:53:09.066 [rank:5] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73024, throughput: 487.46 | 2022-04-11 06:53:09.066 [rank:6] [eval], epoch: 40/50, iter: 125/125, loss: 0.00000, lr: 0.119556, top1: 0.73664, throughput: 486.66 | 2022-04-11 06:53:09.083 [rank:3] [train], epoch: 41/50, iter: 100/834, loss: 0.25387, lr: 0.116474, top1: 0.74089, throughput: 315.34 | 2022-04-11 06:54:09.940 [rank:0] [train], epoch: 41/50, iter: 100/834, loss: 0.25706, lr: 0.116474, top1: 0.73365, throughput: 315.23 | 2022-04-11 06:54:09.944 [rank:2] [train], epoch: 41/50, iter: 100/834, loss: 0.25053, lr: 0.116474, top1: 0.74849, throughput: 315.23 | 2022-04-11 06:54:09.956 [rank:5] [train], epoch: 41/50, iter: 100/834, loss: 0.25404, lr: 0.116474, top1: 0.74500, throughput: 315.31 | 2022-04-11 06:54:09.958 [rank:4] [train], epoch: 41/50, iter: 100/834, loss: 0.25325, lr: 0.116474, top1: 0.74219, throughput: 315.19 | 2022-04-11 06:54:09.969 [rank:1] [train], epoch: 41/50, iter: 100/834, loss: 0.25545, lr: 0.116474, top1: 0.73859, throughput: 315.13 | 2022-04-11 06:54:09.971 [rank:6] [train], epoch: 41/50, iter: 100/834, loss: 0.25633, lr: 0.116474, top1: 0.73792, throughput: 315.13 | 2022-04-11 06:54:10.010 [rank:7] [train], epoch: 41/50, iter: 100/834, loss: 0.25393, lr: 0.116474, top1: 0.74312, throughput: 315.02 | 2022-04-11 06:54:10.014 [rank:6] [train], epoch: 41/50, iter: 200/834, loss: 0.25361, lr: 0.113429, top1: 0.73990, throughput: 313.10 | 2022-04-11 06:55:11.333 [rank:5] [train], epoch: 41/50, iter: 200/834, loss: 0.25360, lr: 0.113429, top1: 0.74448, throughput: 312.83 | 2022-04-11 06:55:11.334 [rank:4] [train], epoch: 41/50, iter: 200/834, loss: 0.25372, lr: 0.113429, top1: 0.74026, throughput: 312.74 | 2022-04-11 06:55:11.361 [rank:2] [train], epoch: 41/50, iter: 200/834, loss: 0.25589, lr: 0.113429, top1: 0.73776, throughput: 312.62 | 2022-04-11 06:55:11.373 [rank:0] [train], epoch: 41/50, iter: 200/834, loss: 0.25302, lr: 0.113429, top1: 0.74250, throughput: 312.52 | 2022-04-11 06:55:11.380 [rank:3] [train], epoch: 41/50, iter: 200/834, loss: 0.25278, lr: 0.113429, top1: 0.74198, throughput: 312.45 | 2022-04-11 06:55:11.389 [rank:1] [train], epoch: 41/50, iter: 200/834, loss: 0.25472, lr: 0.113429, top1: 0.74031, throughput: 312.57 | 2022-04-11 06:55:11.396 [rank:7] [train], epoch: 41/50, iter: 200/834, loss: 0.25465, lr: 0.113429, top1: 0.73849, throughput: 312.66 | 2022-04-11 06:55:11.423 [rank:3] [train], epoch: 41/50, iter: 300/834, loss: 0.25372, lr: 0.110422, top1: 0.74156, throughput: 312.75 | 2022-04-11 06:56:12.781 [rank:0] [train], epoch: 41/50, iter: 300/834, loss: 0.25494, lr: 0.110422, top1: 0.74000, throughput: 312.67 | 2022-04-11 06:56:12.787 [rank:2] [train], epoch: 41/50, iter: 300/834, loss: 0.25225, lr: 0.110422, top1: 0.74599, throughput: 312.59 | 2022-04-11 06:56:12.795 [rank:1] [train], epoch: 41/50, iter: 300/834, loss: 0.25378, lr: 0.110422, top1: 0.74010, throughput: 312.66 | 2022-04-11 06:56:12.805 [rank:4] [train], epoch: 41/50, iter: 300/834, loss: 0.25521, lr: 0.110422, top1: 0.73896, throughput: 312.42 | 2022-04-11 06:56:12.817 [rank:5] [train], epoch: 41/50, iter: 300/834, loss: 0.25587, lr: 0.110422, top1: 0.74078, throughput: 312.24 | 2022-04-11 06:56:12.825 [rank:6] [train], epoch: 41/50, iter: 300/834, loss: 0.25516, lr: 0.110422, top1: 0.73854, throughput: 312.18 | 2022-04-11 06:56:12.836 [rank:7] [train], epoch: 41/50, iter: 300/834, loss: 0.25366, lr: 0.110422, top1: 0.73922, throughput: 312.58 | 2022-04-11 06:56:12.847 [rank:4] [train], epoch: 41/50, iter: 400/834, loss: 0.25290, lr: 0.107451, top1: 0.74391, throughput: 311.76 | 2022-04-11 06:57:14.402 [rank:5] [train], epoch: 41/50, iter: 400/834, loss: 0.25624, lr: 0.107451, top1: 0.73760, throughput: 311.79 | 2022-04-11 06:57:14.406 [rank:3] [train], epoch: 41/50, iter: 400/834, loss: 0.25485, lr: 0.107451, top1: 0.73927, throughput: 311.43 | 2022-04-11 06:57:14.432 [rank:6] [train], epoch: 41/50, iter: 400/834, loss: 0.25706, lr: 0.107451, top1: 0.73036, throughput: 311.69 | 2022-04-11 06:57:14.435 [rank:0] [train], epoch: 41/50, iter: 400/834, loss: 0.25226, lr: 0.107451, top1: 0.74349, throughput: 311.44 | 2022-04-11 06:57:14.437 [rank:1] [train], epoch: 41/50, iter: 400/834, loss: 0.25493, lr: 0.107451, top1: 0.74161, throughput: 311.50 | 2022-04-11 06:57:14.443 [rank:7] [train], epoch: 41/50, iter: 400/834, loss: 0.25293, lr: 0.107451, top1: 0.74661, throughput: 311.70 | 2022-04-11 06:57:14.444 [rank:2] [train], epoch: 41/50, iter: 400/834, loss: 0.25504, lr: 0.107451, top1: 0.74083, throughput: 311.34 | 2022-04-11 06:57:14.464 [rank:6] [train], epoch: 41/50, iter: 500/834, loss: 0.25494, lr: 0.104518, top1: 0.73937, throughput: 313.43 | 2022-04-11 06:58:15.693 [rank:4] [train], epoch: 41/50, iter: 500/834, loss: 0.25393, lr: 0.104518, top1: 0.74443, throughput: 313.20 | 2022-04-11 06:58:15.706 [rank:2] [train], epoch: 41/50, iter: 500/834, loss: 0.25715, lr: 0.104518, top1: 0.73422, throughput: 313.46 | 2022-04-11 06:58:15.716 [rank:5] [train], epoch: 41/50, iter: 500/834, loss: 0.25536, lr: 0.104518, top1: 0.73724, throughput: 313.08 | 2022-04-11 06:58:15.732 [rank:0] [train], epoch: 41/50, iter: 500/834, loss: 0.25557, lr: 0.104518, top1: 0.73578, throughput: 313.19 | 2022-04-11 06:58:15.742 [rank:3] [train], epoch: 41/50, iter: 500/834, loss: 0.25406, lr: 0.104518, top1: 0.73943, throughput: 313.50 | 2022-04-11 06:58:15.675 [rank:1] [train], epoch: 41/50, iter: 500/834, loss: 0.25612, lr: 0.104518, top1: 0.73635, throughput: 313.54 | 2022-04-11 06:58:15.678 [rank:7] [train], epoch: 41/50, iter: 500/834, loss: 0.25525, lr: 0.104518, top1: 0.73911, throughput: 312.96 | 2022-04-11 06:58:15.794 [rank:3] [train], epoch: 41/50, iter: 600/834, loss: 0.25333, lr: 0.101623, top1: 0.74130, throughput: 313.50 | 2022-04-11 06:59:16.919 [rank:5] [train], epoch: 41/50, iter: 600/834, loss: 0.25629, lr: 0.101623, top1: 0.73849, throughput: 313.78 | 2022-04-11 06:59:16.922 [rank:4] [train], epoch: 41/50, iter: 600/834, loss: 0.25317, lr: 0.101623, top1: 0.74359, throughput: 313.62 | 2022-04-11 06:59:16.927 [rank:6] [train], epoch: 41/50, iter: 600/834, loss: 0.25420, lr: 0.101623, top1: 0.73984, throughput: 313.38 | 2022-04-11 06:59:16.960 [rank:2] [train], epoch: 41/50, iter: 600/834, loss: 0.25226, lr: 0.101623, top1: 0.74240, throughput: 313.48 | 2022-04-11 06:59:16.964 [rank:1] [train], epoch: 41/50, iter: 600/834, loss: 0.25615, lr: 0.101623, top1: 0.73495, throughput: 313.04 | 2022-04-11 06:59:17.012 [rank:7] [train], epoch: 41/50, iter: 600/834, loss: 0.25588, lr: 0.101623, top1: 0.73917, throughput: 313.59 | 2022-04-11 06:59:17.021 [rank:0] [train], epoch: 41/50, iter: 600/834, loss: 0.25670, lr: 0.101623, top1: 0.73667, throughput: 313.30 | 2022-04-11 06:59:17.025 [rank:4] [train], epoch: 41/50, iter: 700/834, loss: 0.25421, lr: 0.098766, top1: 0.73677, throughput: 314.65 | 2022-04-11 07:00:17.947 [rank:1] [train], epoch: 41/50, iter: 700/834, loss: 0.25732, lr: 0.098766, top1: 0.73490, throughput: 315.01 | 2022-04-11 07:00:17.962 [rank:6] [train], epoch: 41/50, iter: 700/834, loss: 0.25459, lr: 0.098766, top1: 0.73802, throughput: 314.70 | 2022-04-11 07:00:17.971 [rank:7] [train], epoch: 41/50, iter: 700/834, loss: 0.25430, lr: 0.098766, top1: 0.74073, throughput: 315.01 | 2022-04-11 07:00:17.972 [rank:2] [train], epoch: 41/50, iter: 700/834, loss: 0.25348, lr: 0.098766, top1: 0.74182, throughput: 314.59 | 2022-04-11 07:00:17.996 [rank:3] [train], epoch: 41/50, iter: 700/834, loss: 0.25370, lr: 0.098766, top1: 0.73901, throughput: 314.29 | 2022-04-11 07:00:18.009 [rank:5] [train], epoch: 41/50, iter: 700/834, loss: 0.25354, lr: 0.098766, top1: 0.73880, throughput: 314.26 | 2022-04-11 07:00:18.017 [rank:0] [train], epoch: 41/50, iter: 700/834, loss: 0.25195, lr: 0.098766, top1: 0.74542, throughput: 315.15 | 2022-04-11 07:00:17.949 [rank:1] [train], epoch: 41/50, iter: 800/834, loss: 0.25598, lr: 0.095946, top1: 0.73609, throughput: 313.69 | 2022-04-11 07:01:19.168 [rank:4] [train], epoch: 41/50, iter: 800/834, loss: 0.25311, lr: 0.095946, top1: 0.74495, throughput: 313.46 | 2022-04-11 07:01:19.199 [rank:3] [train], epoch: 41/50, iter: 800/834, loss: 0.25332, lr: 0.095946, top1: 0.74016, throughput: 313.66 | 2022-04-11 07:01:19.222 [rank:5] [train], epoch: 41/50, iter: 800/834, loss: 0.25478, lr: 0.095946, top1: 0.73880, throughput: 313.65 | 2022-04-11 07:01:19.232 [rank:2] [train], epoch: 41/50, iter: 800/834, loss: 0.25330, lr: 0.095946, top1: 0.74042, throughput: 313.52 | 2022-04-11 07:01:19.236 [rank:7] [train], epoch: 41/50, iter: 800/834, loss: 0.25535, lr: 0.095946, top1: 0.73760, throughput: 313.40 | 2022-04-11 07:01:19.235 [rank:6] [train], epoch: 41/50, iter: 800/834, loss: 0.25452, lr: 0.095946, top1: 0.73828, throughput: 313.18 | 2022-04-11 07:01:19.277 [rank:0] [train], epoch: 41/50, iter: 800/834, loss: 0.25476, lr: 0.095946, top1: 0.73958, throughput: 313.00 | 2022-04-11 07:01:19.291 [rank:5] [train], epoch: 41/50, iter: 834/834, loss: 0.25430, lr: 0.094996, top1: 0.73882, throughput: 309.82 | 2022-04-11 07:01:40.303 [rank:4] [train], epoch: 41/50, iter: 834/834, loss: 0.25193, lr: 0.094996, top1: 0.74663, throughput: 309.31 | 2022-04-11 07:01:40.304 [rank:0] [train], epoch: 41/50, iter: 834/834, loss: 0.25654, lr: 0.094996, top1: 0.73024, throughput: 310.67 | 2022-04-11 07:01:40.304 [rank:2] [train], epoch: 41/50, iter: 834/834, loss: 0.25241, lr: 0.094996, top1: 0.74847, throughput: 309.85 | 2022-04-11 07:01:40.304 [rank:6] [train], epoch: 41/50, iter: 834/834, loss: 0.25775, lr: 0.094996, top1: 0.73055, throughput: 310.44 | 2022-04-11 07:01:40.305 [rank:1] [train], epoch: 41/50, iter: 834/834, loss: 0.25423, lr: 0.094996, top1: 0.74234, throughput: 308.72 | 2022-04-11 07:01:40.313 [rank:3] [train], epoch: 41/50, iter: 834/834, loss: 0.25484, lr: 0.094996, top1: 0.73912, throughput: 309.47 | 2022-04-11 07:01:40.316 [rank:7] [train], epoch: 41/50, iter: 834/834, loss: 0.25885, lr: 0.094996, top1: 0.72886, throughput: 309.12 | 2022-04-11 07:01:40.353 [rank:0] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.73568, throughput: 487.28 | 2022-04-11 07:01:53.130 [rank:1] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.73712, throughput: 487.42 | 2022-04-11 07:01:53.136 [rank:2] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.72128, throughput: 487.05 | 2022-04-11 07:01:53.136 [rank:3] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.72240, throughput: 487.18 | 2022-04-11 07:01:53.145 [rank:5] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.72544, throughput: 486.09 | 2022-04-11 07:01:53.160 [rank:4] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.72720, throughput: 486.00 | 2022-04-11 07:01:53.164 [rank:7] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.73856, throughput: 487.34 | 2022-04-11 07:01:53.178 [rank:6] [eval], epoch: 41/50, iter: 125/125, loss: 0.00000, lr: 0.094996, top1: 0.73456, throughput: 485.51 | 2022-04-11 07:01:53.178 [rank:3] [train], epoch: 42/50, iter: 100/834, loss: 0.25001, lr: 0.092228, top1: 0.75063, throughput: 313.70 | 2022-04-11 07:02:54.350 [rank:2] [train], epoch: 42/50, iter: 100/834, loss: 0.24801, lr: 0.092228, top1: 0.75380, throughput: 313.65 | 2022-04-11 07:02:54.350 [rank:1] [train], epoch: 42/50, iter: 100/834, loss: 0.25098, lr: 0.092228, top1: 0.74880, throughput: 313.65 | 2022-04-11 07:02:54.351 [rank:4] [train], epoch: 42/50, iter: 100/834, loss: 0.24897, lr: 0.092228, top1: 0.74932, throughput: 313.70 | 2022-04-11 07:02:54.369 [rank:0] [train], epoch: 42/50, iter: 100/834, loss: 0.24838, lr: 0.092228, top1: 0.75115, throughput: 313.43 | 2022-04-11 07:02:54.387 [rank:7] [train], epoch: 42/50, iter: 100/834, loss: 0.24950, lr: 0.092228, top1: 0.75359, throughput: 313.67 | 2022-04-11 07:02:54.389 [rank:6] [train], epoch: 42/50, iter: 100/834, loss: 0.25169, lr: 0.092228, top1: 0.74620, throughput: 313.63 | 2022-04-11 07:02:54.397 [rank:5] [train], epoch: 42/50, iter: 100/834, loss: 0.24837, lr: 0.092228, top1: 0.75125, throughput: 313.87 | 2022-04-11 07:02:54.332 [rank:6] [train], epoch: 42/50, iter: 200/834, loss: 0.25000, lr: 0.089498, top1: 0.74885, throughput: 314.63 | 2022-04-11 07:03:55.421 [rank:7] [train], epoch: 42/50, iter: 200/834, loss: 0.24943, lr: 0.089498, top1: 0.75193, throughput: 314.55 | 2022-04-11 07:03:55.428 [rank:3] [train], epoch: 42/50, iter: 200/834, loss: 0.25024, lr: 0.089498, top1: 0.75104, throughput: 314.26 | 2022-04-11 07:03:55.447 [rank:0] [train], epoch: 42/50, iter: 200/834, loss: 0.24982, lr: 0.089498, top1: 0.74917, throughput: 314.40 | 2022-04-11 07:03:55.457 [rank:4] [train], epoch: 42/50, iter: 200/834, loss: 0.25159, lr: 0.089498, top1: 0.74333, throughput: 314.27 | 2022-04-11 07:03:55.463 [rank:5] [train], epoch: 42/50, iter: 200/834, loss: 0.24791, lr: 0.089498, top1: 0.75266, throughput: 314.08 | 2022-04-11 07:03:55.463 [rank:1] [train], epoch: 42/50, iter: 200/834, loss: 0.25261, lr: 0.089498, top1: 0.74255, throughput: 314.17 | 2022-04-11 07:03:55.464 [rank:2] [train], epoch: 42/50, iter: 200/834, loss: 0.25152, lr: 0.089498, top1: 0.74687, throughput: 313.95 | 2022-04-11 07:03:55.507 [rank:1] [train], epoch: 42/50, iter: 300/834, loss: 0.24946, lr: 0.086807, top1: 0.75010, throughput: 311.97 | 2022-04-11 07:04:57.008 [rank:5] [train], epoch: 42/50, iter: 300/834, loss: 0.25031, lr: 0.086807, top1: 0.74776, throughput: 311.93 | 2022-04-11 07:04:57.015 [rank:4] [train], epoch: 42/50, iter: 300/834, loss: 0.24752, lr: 0.086807, top1: 0.75536, throughput: 311.87 | 2022-04-11 07:04:57.026 [rank:6] [train], epoch: 42/50, iter: 300/834, loss: 0.25126, lr: 0.086807, top1: 0.74594, throughput: 311.55 | 2022-04-11 07:04:57.049 [rank:7] [train], epoch: 42/50, iter: 300/834, loss: 0.24836, lr: 0.086807, top1: 0.75302, throughput: 311.54 | 2022-04-11 07:04:57.057 [rank:3] [train], epoch: 42/50, iter: 300/834, loss: 0.25086, lr: 0.086807, top1: 0.74797, throughput: 311.60 | 2022-04-11 07:04:57.065 [rank:2] [train], epoch: 42/50, iter: 300/834, loss: 0.25114, lr: 0.086807, top1: 0.74437, throughput: 311.85 | 2022-04-11 07:04:57.075 [rank:0] [train], epoch: 42/50, iter: 300/834, loss: 0.25022, lr: 0.086807, top1: 0.75141, throughput: 311.50 | 2022-04-11 07:04:57.094 [rank:1] [train], epoch: 42/50, iter: 400/834, loss: 0.25035, lr: 0.084154, top1: 0.75187, throughput: 312.51 | 2022-04-11 07:05:58.446 [rank:0] [train], epoch: 42/50, iter: 400/834, loss: 0.24990, lr: 0.084154, top1: 0.75026, throughput: 312.91 | 2022-04-11 07:05:58.454 [rank:7] [train], epoch: 42/50, iter: 400/834, loss: 0.25016, lr: 0.084154, top1: 0.74813, throughput: 312.63 | 2022-04-11 07:05:58.471 [rank:2] [train], epoch: 42/50, iter: 400/834, loss: 0.24905, lr: 0.084154, top1: 0.75323, throughput: 312.72 | 2022-04-11 07:05:58.472 [rank:5] [train], epoch: 42/50, iter: 400/834, loss: 0.24952, lr: 0.084154, top1: 0.74901, throughput: 312.41 | 2022-04-11 07:05:58.472 [rank:3] [train], epoch: 42/50, iter: 400/834, loss: 0.24969, lr: 0.084154, top1: 0.74911, throughput: 312.63 | 2022-04-11 07:05:58.480 [rank:6] [train], epoch: 42/50, iter: 400/834, loss: 0.25154, lr: 0.084154, top1: 0.74495, throughput: 312.50 | 2022-04-11 07:05:58.488 [rank:4] [train], epoch: 42/50, iter: 400/834, loss: 0.25037, lr: 0.084154, top1: 0.74833, throughput: 312.20 | 2022-04-11 07:05:58.525 [rank:3] [train], epoch: 42/50, iter: 500/834, loss: 0.24841, lr: 0.081540, top1: 0.75599, throughput: 311.81 | 2022-04-11 07:07:00.056 [rank:5] [train], epoch: 42/50, iter: 500/834, loss: 0.24896, lr: 0.081540, top1: 0.75198, throughput: 311.71 | 2022-04-11 07:07:00.067 [rank:2] [train], epoch: 42/50, iter: 500/834, loss: 0.25072, lr: 0.081540, top1: 0.75083, throughput: 311.64 | 2022-04-11 07:07:00.081 [rank:4] [train], epoch: 42/50, iter: 500/834, loss: 0.24997, lr: 0.081540, top1: 0.74927, throughput: 311.91 | 2022-04-11 07:07:00.082 [rank:6] [train], epoch: 42/50, iter: 500/834, loss: 0.25187, lr: 0.081540, top1: 0.74333, throughput: 311.65 | 2022-04-11 07:07:00.096 [rank:1] [train], epoch: 42/50, iter: 500/834, loss: 0.24945, lr: 0.081540, top1: 0.74932, throughput: 311.34 | 2022-04-11 07:07:00.115 [rank:0] [train], epoch: 42/50, iter: 500/834, loss: 0.25069, lr: 0.081540, top1: 0.74870, throughput: 311.30 | 2022-04-11 07:07:00.130 [rank:7] [train], epoch: 42/50, iter: 500/834, loss: 0.24964, lr: 0.081540, top1: 0.75078, throughput: 311.76 | 2022-04-11 07:07:00.056 [rank:2] [train], epoch: 42/50, iter: 600/834, loss: 0.25216, lr: 0.078965, top1: 0.74724, throughput: 313.28 | 2022-04-11 07:08:01.368 [rank:5] [train], epoch: 42/50, iter: 600/834, loss: 0.24968, lr: 0.078965, top1: 0.75109, throughput: 313.02 | 2022-04-11 07:08:01.405 [rank:4] [train], epoch: 42/50, iter: 600/834, loss: 0.24992, lr: 0.078965, top1: 0.74677, throughput: 313.05 | 2022-04-11 07:08:01.413 [rank:1] [train], epoch: 42/50, iter: 600/834, loss: 0.25097, lr: 0.078965, top1: 0.74604, throughput: 313.16 | 2022-04-11 07:08:01.427 [rank:6] [train], epoch: 42/50, iter: 600/834, loss: 0.24926, lr: 0.078965, top1: 0.75214, throughput: 313.01 | 2022-04-11 07:08:01.436 [rank:0] [train], epoch: 42/50, iter: 600/834, loss: 0.24866, lr: 0.078965, top1: 0.74990, throughput: 313.14 | 2022-04-11 07:08:01.446 [rank:3] [train], epoch: 42/50, iter: 600/834, loss: 0.25312, lr: 0.078965, top1: 0.74161, throughput: 312.70 | 2022-04-11 07:08:01.457 [rank:7] [train], epoch: 42/50, iter: 600/834, loss: 0.25123, lr: 0.078965, top1: 0.74474, throughput: 313.10 | 2022-04-11 07:08:01.378 [rank:0] [train], epoch: 42/50, iter: 700/834, loss: 0.25155, lr: 0.076429, top1: 0.74406, throughput: 313.29 | 2022-04-11 07:09:02.732 [rank:6] [train], epoch: 42/50, iter: 700/834, loss: 0.25097, lr: 0.076429, top1: 0.74687, throughput: 313.18 | 2022-04-11 07:09:02.742 [rank:7] [train], epoch: 42/50, iter: 700/834, loss: 0.25014, lr: 0.076429, top1: 0.75000, throughput: 312.83 | 2022-04-11 07:09:02.753 [rank:4] [train], epoch: 42/50, iter: 700/834, loss: 0.25063, lr: 0.076429, top1: 0.74760, throughput: 312.96 | 2022-04-11 07:09:02.763 [rank:5] [train], epoch: 42/50, iter: 700/834, loss: 0.24800, lr: 0.076429, top1: 0.75411, throughput: 312.91 | 2022-04-11 07:09:02.765 [rank:2] [train], epoch: 42/50, iter: 700/834, loss: 0.25110, lr: 0.076429, top1: 0.75052, throughput: 312.71 | 2022-04-11 07:09:02.768 [rank:1] [train], epoch: 42/50, iter: 700/834, loss: 0.24988, lr: 0.076429, top1: 0.74818, throughput: 312.89 | 2022-04-11 07:09:02.789 [rank:3] [train], epoch: 42/50, iter: 700/834, loss: 0.25012, lr: 0.076429, top1: 0.74547, throughput: 312.97 | 2022-04-11 07:09:02.805 [rank:5] [train], epoch: 42/50, iter: 800/834, loss: 0.25020, lr: 0.073933, top1: 0.74693, throughput: 313.47 | 2022-04-11 07:10:04.015 [rank:1] [train], epoch: 42/50, iter: 800/834, loss: 0.24937, lr: 0.073933, top1: 0.75365, throughput: 313.53 | 2022-04-11 07:10:04.027 [rank:0] [train], epoch: 42/50, iter: 800/834, loss: 0.24925, lr: 0.073933, top1: 0.74896, throughput: 313.19 | 2022-04-11 07:10:04.037 [rank:6] [train], epoch: 42/50, iter: 800/834, loss: 0.25007, lr: 0.073933, top1: 0.74839, throughput: 313.18 | 2022-04-11 07:10:04.048 [rank:4] [train], epoch: 42/50, iter: 800/834, loss: 0.25130, lr: 0.073933, top1: 0.74583, throughput: 313.23 | 2022-04-11 07:10:04.061 [rank:7] [train], epoch: 42/50, iter: 800/834, loss: 0.24751, lr: 0.073933, top1: 0.75557, throughput: 313.04 | 2022-04-11 07:10:04.087 [rank:3] [train], epoch: 42/50, iter: 800/834, loss: 0.25020, lr: 0.073933, top1: 0.74688, throughput: 313.26 | 2022-04-11 07:10:04.097 [rank:2] [train], epoch: 42/50, iter: 800/834, loss: 0.25072, lr: 0.073933, top1: 0.74922, throughput: 313.04 | 2022-04-11 07:10:04.102 [rank:2] [train], epoch: 42/50, iter: 834/834, loss: 0.24635, lr: 0.073093, top1: 0.75751, throughput: 314.46 | 2022-04-11 07:10:24.862 [rank:0] [train], epoch: 42/50, iter: 834/834, loss: 0.25052, lr: 0.073093, top1: 0.74173, throughput: 312.55 | 2022-04-11 07:10:24.923 [rank:5] [train], epoch: 42/50, iter: 834/834, loss: 0.24861, lr: 0.073093, top1: 0.75153, throughput: 312.16 | 2022-04-11 07:10:24.928 [rank:4] [train], epoch: 42/50, iter: 834/834, loss: 0.25265, lr: 0.073093, top1: 0.74464, throughput: 312.79 | 2022-04-11 07:10:24.931 [rank:7] [train], epoch: 42/50, iter: 834/834, loss: 0.24786, lr: 0.073093, top1: 0.75123, throughput: 313.09 | 2022-04-11 07:10:24.937 [rank:6] [train], epoch: 42/50, iter: 834/834, loss: 0.24763, lr: 0.073093, top1: 0.74893, throughput: 312.44 | 2022-04-11 07:10:24.942 [rank:3] [train], epoch: 42/50, iter: 834/834, loss: 0.25119, lr: 0.073093, top1: 0.74127, throughput: 313.00 | 2022-04-11 07:10:24.953 [rank:1] [train], epoch: 42/50, iter: 834/834, loss: 0.24864, lr: 0.073093, top1: 0.75138, throughput: 311.73 | 2022-04-11 07:10:24.968 [rank:0] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.74288, throughput: 485.39 | 2022-04-11 07:10:37.800 [rank:1] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.75088, throughput: 487.09 | 2022-04-11 07:10:37.800 [rank:2] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.73600, throughput: 482.42 | 2022-04-11 07:10:37.817 [rank:3] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.74400, throughput: 485.83 | 2022-04-11 07:10:37.818 [rank:4] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.74688, throughput: 484.95 | 2022-04-11 07:10:37.819 [rank:7] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.74992, throughput: 485.19 | 2022-04-11 07:10:37.818 [rank:6] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.74912, throughput: 484.70 | 2022-04-11 07:10:37.837 [rank:5] [eval], epoch: 42/50, iter: 125/125, loss: 0.00000, lr: 0.073093, top1: 0.74224, throughput: 483.59 | 2022-04-11 07:10:37.852 [rank:4] [train], epoch: 43/50, iter: 100/834, loss: 0.24669, lr: 0.070649, top1: 0.75453, throughput: 313.67 | 2022-04-11 07:11:39.030 [rank:1] [train], epoch: 43/50, iter: 100/834, loss: 0.24570, lr: 0.070649, top1: 0.75911, throughput: 313.54 | 2022-04-11 07:11:39.036 [rank:0] [train], epoch: 43/50, iter: 100/834, loss: 0.24673, lr: 0.070649, top1: 0.75990, throughput: 313.51 | 2022-04-11 07:11:39.041 [rank:3] [train], epoch: 43/50, iter: 100/834, loss: 0.24393, lr: 0.070649, top1: 0.76406, throughput: 313.46 | 2022-04-11 07:11:39.069 [rank:2] [train], epoch: 43/50, iter: 100/834, loss: 0.24587, lr: 0.070649, top1: 0.75969, throughput: 313.36 | 2022-04-11 07:11:39.088 [rank:7] [train], epoch: 43/50, iter: 100/834, loss: 0.24646, lr: 0.070649, top1: 0.75562, throughput: 313.33 | 2022-04-11 07:11:39.096 [rank:6] [train], epoch: 43/50, iter: 100/834, loss: 0.24343, lr: 0.070649, top1: 0.76333, throughput: 313.38 | 2022-04-11 07:11:39.105 [rank:5] [train], epoch: 43/50, iter: 100/834, loss: 0.24419, lr: 0.070649, top1: 0.76125, throughput: 313.33 | 2022-04-11 07:11:39.129 [rank:3] [train], epoch: 43/50, iter: 200/834, loss: 0.24546, lr: 0.068245, top1: 0.75740, throughput: 312.40 | 2022-04-11 07:12:40.530 [rank:2] [train], epoch: 43/50, iter: 200/834, loss: 0.24622, lr: 0.068245, top1: 0.76214, throughput: 312.44 | 2022-04-11 07:12:40.540 [rank:7] [train], epoch: 43/50, iter: 200/834, loss: 0.24243, lr: 0.068245, top1: 0.76359, throughput: 312.47 | 2022-04-11 07:12:40.541 [rank:5] [train], epoch: 43/50, iter: 200/834, loss: 0.24670, lr: 0.068245, top1: 0.75760, throughput: 312.63 | 2022-04-11 07:12:40.543 [rank:0] [train], epoch: 43/50, iter: 200/834, loss: 0.24409, lr: 0.068245, top1: 0.76078, throughput: 312.14 | 2022-04-11 07:12:40.551 [rank:6] [train], epoch: 43/50, iter: 200/834, loss: 0.24501, lr: 0.068245, top1: 0.76307, throughput: 312.36 | 2022-04-11 07:12:40.573 [rank:4] [train], epoch: 43/50, iter: 200/834, loss: 0.24664, lr: 0.068245, top1: 0.75677, throughput: 311.89 | 2022-04-11 07:12:40.591 [rank:1] [train], epoch: 43/50, iter: 200/834, loss: 0.24546, lr: 0.068245, top1: 0.75870, throughput: 311.60 | 2022-04-11 07:12:40.653 [rank:7] [train], epoch: 43/50, iter: 300/834, loss: 0.24598, lr: 0.065880, top1: 0.75984, throughput: 312.93 | 2022-04-11 07:13:41.897 [rank:0] [train], epoch: 43/50, iter: 300/834, loss: 0.24551, lr: 0.065880, top1: 0.75896, throughput: 312.95 | 2022-04-11 07:13:41.903 [rank:5] [train], epoch: 43/50, iter: 300/834, loss: 0.24626, lr: 0.065880, top1: 0.75932, throughput: 312.84 | 2022-04-11 07:13:41.916 [rank:2] [train], epoch: 43/50, iter: 300/834, loss: 0.24523, lr: 0.065880, top1: 0.75807, throughput: 312.82 | 2022-04-11 07:13:41.918 [rank:6] [train], epoch: 43/50, iter: 300/834, loss: 0.24715, lr: 0.065880, top1: 0.75453, throughput: 312.89 | 2022-04-11 07:13:41.936 [rank:4] [train], epoch: 43/50, iter: 300/834, loss: 0.24687, lr: 0.065880, top1: 0.76021, throughput: 312.94 | 2022-04-11 07:13:41.944 [rank:3] [train], epoch: 43/50, iter: 300/834, loss: 0.24651, lr: 0.065880, top1: 0.75672, throughput: 312.47 | 2022-04-11 07:13:41.975 [rank:1] [train], epoch: 43/50, iter: 300/834, loss: 0.24474, lr: 0.065880, top1: 0.76026, throughput: 313.43 | 2022-04-11 07:13:41.911 [rank:2] [train], epoch: 43/50, iter: 400/834, loss: 0.24731, lr: 0.063556, top1: 0.75573, throughput: 312.10 | 2022-04-11 07:14:43.437 [rank:0] [train], epoch: 43/50, iter: 400/834, loss: 0.24382, lr: 0.063556, top1: 0.76068, throughput: 311.71 | 2022-04-11 07:14:43.497 [rank:6] [train], epoch: 43/50, iter: 400/834, loss: 0.24612, lr: 0.063556, top1: 0.75568, throughput: 311.74 | 2022-04-11 07:14:43.527 [rank:7] [train], epoch: 43/50, iter: 400/834, loss: 0.24541, lr: 0.063556, top1: 0.76266, throughput: 311.48 | 2022-04-11 07:14:43.539 [rank:3] [train], epoch: 43/50, iter: 400/834, loss: 0.24693, lr: 0.063556, top1: 0.75516, throughput: 311.80 | 2022-04-11 07:14:43.553 [rank:4] [train], epoch: 43/50, iter: 400/834, loss: 0.24456, lr: 0.063556, top1: 0.75828, throughput: 311.57 | 2022-04-11 07:14:43.568 [rank:5] [train], epoch: 43/50, iter: 400/834, loss: 0.24487, lr: 0.063556, top1: 0.75797, throughput: 311.42 | 2022-04-11 07:14:43.569 [rank:1] [train], epoch: 43/50, iter: 400/834, loss: 0.24737, lr: 0.063556, top1: 0.75464, throughput: 311.29 | 2022-04-11 07:14:43.591 [rank:5] [train], epoch: 43/50, iter: 500/834, loss: 0.24650, lr: 0.061271, top1: 0.75766, throughput: 313.07 | 2022-04-11 07:15:44.898 [rank:0] [train], epoch: 43/50, iter: 500/834, loss: 0.24470, lr: 0.061271, top1: 0.76240, throughput: 312.57 | 2022-04-11 07:15:44.924 [rank:4] [train], epoch: 43/50, iter: 500/834, loss: 0.24710, lr: 0.061271, top1: 0.75333, throughput: 312.86 | 2022-04-11 07:15:44.939 [rank:1] [train], epoch: 43/50, iter: 500/834, loss: 0.24611, lr: 0.061271, top1: 0.75750, throughput: 312.94 | 2022-04-11 07:15:44.944 [rank:2] [train], epoch: 43/50, iter: 500/834, loss: 0.24589, lr: 0.061271, top1: 0.75573, throughput: 312.14 | 2022-04-11 07:15:44.949 [rank:7] [train], epoch: 43/50, iter: 500/834, loss: 0.24587, lr: 0.061271, top1: 0.75865, throughput: 312.59 | 2022-04-11 07:15:44.961 [rank:6] [train], epoch: 43/50, iter: 500/834, loss: 0.24489, lr: 0.061271, top1: 0.75875, throughput: 312.92 | 2022-04-11 07:15:44.884 [rank:3] [train], epoch: 43/50, iter: 500/834, loss: 0.24486, lr: 0.061271, top1: 0.75615, throughput: 312.49 | 2022-04-11 07:15:44.994 [rank:1] [train], epoch: 43/50, iter: 600/834, loss: 0.24650, lr: 0.059026, top1: 0.75620, throughput: 313.12 | 2022-04-11 07:16:46.262 [rank:3] [train], epoch: 43/50, iter: 600/834, loss: 0.24543, lr: 0.059026, top1: 0.76005, throughput: 313.31 | 2022-04-11 07:16:46.275 [rank:2] [train], epoch: 43/50, iter: 600/834, loss: 0.24670, lr: 0.059026, top1: 0.75505, throughput: 312.97 | 2022-04-11 07:16:46.296 [rank:0] [train], epoch: 43/50, iter: 600/834, loss: 0.24580, lr: 0.059026, top1: 0.75682, throughput: 312.82 | 2022-04-11 07:16:46.301 [rank:5] [train], epoch: 43/50, iter: 600/834, loss: 0.24498, lr: 0.059026, top1: 0.76156, throughput: 312.66 | 2022-04-11 07:16:46.307 [rank:6] [train], epoch: 43/50, iter: 600/834, loss: 0.24679, lr: 0.059026, top1: 0.75318, throughput: 312.45 | 2022-04-11 07:16:46.333 [rank:4] [train], epoch: 43/50, iter: 600/834, loss: 0.24442, lr: 0.059026, top1: 0.76063, throughput: 312.73 | 2022-04-11 07:16:46.334 [rank:7] [train], epoch: 43/50, iter: 600/834, loss: 0.24662, lr: 0.059026, top1: 0.75745, throughput: 312.84 | 2022-04-11 07:16:46.335 [rank:0] [train], epoch: 43/50, iter: 700/834, loss: 0.24561, lr: 0.056822, top1: 0.75979, throughput: 312.00 | 2022-04-11 07:17:47.839 [rank:7] [train], epoch: 43/50, iter: 700/834, loss: 0.24845, lr: 0.056822, top1: 0.75297, throughput: 312.07 | 2022-04-11 07:17:47.859 [rank:1] [train], epoch: 43/50, iter: 700/834, loss: 0.24573, lr: 0.056822, top1: 0.75953, throughput: 311.65 | 2022-04-11 07:17:47.871 [rank:2] [train], epoch: 43/50, iter: 700/834, loss: 0.24344, lr: 0.056822, top1: 0.76203, throughput: 311.63 | 2022-04-11 07:17:47.907 [rank:6] [train], epoch: 43/50, iter: 700/834, loss: 0.24668, lr: 0.056822, top1: 0.75755, throughput: 311.81 | 2022-04-11 07:17:47.909 [rank:4] [train], epoch: 43/50, iter: 700/834, loss: 0.24545, lr: 0.056822, top1: 0.75719, throughput: 311.75 | 2022-04-11 07:17:47.922 [rank:3] [train], epoch: 43/50, iter: 700/834, loss: 0.24600, lr: 0.056822, top1: 0.75635, throughput: 311.42 | 2022-04-11 07:17:47.927 [rank:5] [train], epoch: 43/50, iter: 700/834, loss: 0.24439, lr: 0.056822, top1: 0.75859, throughput: 311.96 | 2022-04-11 07:17:47.854 [rank:5] [train], epoch: 43/50, iter: 800/834, loss: 0.24701, lr: 0.054658, top1: 0.75286, throughput: 314.37 | 2022-04-11 07:18:48.929 [rank:6] [train], epoch: 43/50, iter: 800/834, loss: 0.24652, lr: 0.054658, top1: 0.75578, throughput: 314.65 | 2022-04-11 07:18:48.930 [rank:0] [train], epoch: 43/50, iter: 800/834, loss: 0.24631, lr: 0.054658, top1: 0.75870, throughput: 314.12 | 2022-04-11 07:18:48.961 [rank:1] [train], epoch: 43/50, iter: 800/834, loss: 0.24697, lr: 0.054658, top1: 0.75641, throughput: 314.27 | 2022-04-11 07:18:48.964 [rank:3] [train], epoch: 43/50, iter: 800/834, loss: 0.24737, lr: 0.054658, top1: 0.75417, throughput: 314.55 | 2022-04-11 07:18:48.967 [rank:2] [train], epoch: 43/50, iter: 800/834, loss: 0.24686, lr: 0.054658, top1: 0.75672, throughput: 314.42 | 2022-04-11 07:18:48.973 [rank:4] [train], epoch: 43/50, iter: 800/834, loss: 0.24684, lr: 0.054658, top1: 0.75760, throughput: 314.44 | 2022-04-11 07:18:48.982 [rank:7] [train], epoch: 43/50, iter: 800/834, loss: 0.24480, lr: 0.054658, top1: 0.75885, throughput: 314.10 | 2022-04-11 07:18:48.987 [rank:6] [train], epoch: 43/50, iter: 834/834, loss: 0.24660, lr: 0.053932, top1: 0.75444, throughput: 314.76 | 2022-04-11 07:19:09.670 [rank:5] [train], epoch: 43/50, iter: 834/834, loss: 0.24771, lr: 0.053932, top1: 0.75475, throughput: 314.72 | 2022-04-11 07:19:09.672 [rank:2] [train], epoch: 43/50, iter: 834/834, loss: 0.24476, lr: 0.053932, top1: 0.75904, throughput: 315.34 | 2022-04-11 07:19:09.674 [rank:7] [train], epoch: 43/50, iter: 834/834, loss: 0.24694, lr: 0.053932, top1: 0.75444, throughput: 315.50 | 2022-04-11 07:19:09.677 [rank:0] [train], epoch: 43/50, iter: 834/834, loss: 0.24445, lr: 0.053932, top1: 0.76746, throughput: 314.97 | 2022-04-11 07:19:09.687 [rank:3] [train], epoch: 43/50, iter: 834/834, loss: 0.24781, lr: 0.053932, top1: 0.74939, throughput: 315.05 | 2022-04-11 07:19:09.688 [rank:4] [train], epoch: 43/50, iter: 834/834, loss: 0.24896, lr: 0.053932, top1: 0.75184, throughput: 315.20 | 2022-04-11 07:19:09.693 [rank:1] [train], epoch: 43/50, iter: 834/834, loss: 0.24338, lr: 0.053932, top1: 0.76256, throughput: 314.85 | 2022-04-11 07:19:09.698 [rank:0] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.74720, throughput: 486.68 | 2022-04-11 07:19:22.529 [rank:1] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.75456, throughput: 486.85 | 2022-04-11 07:19:22.536 [rank:2] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.73792, throughput: 485.73 | 2022-04-11 07:19:22.541 [rank:3] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.74272, throughput: 486.25 | 2022-04-11 07:19:22.541 [rank:4] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.74656, throughput: 486.00 | 2022-04-11 07:19:22.553 [rank:5] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.74576, throughput: 484.76 | 2022-04-11 07:19:22.564 [rank:7] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.74944, throughput: 484.97 | 2022-04-11 07:19:22.565 [rank:6] [eval], epoch: 43/50, iter: 125/125, loss: 0.00000, lr: 0.053932, top1: 0.75120, throughput: 483.87 | 2022-04-11 07:19:22.586 [rank:2] [train], epoch: 44/50, iter: 100/834, loss: 0.24319, lr: 0.051822, top1: 0.76260, throughput: 311.49 | 2022-04-11 07:20:24.181 [rank:7] [train], epoch: 44/50, iter: 100/834, loss: 0.24320, lr: 0.051822, top1: 0.76318, throughput: 311.45 | 2022-04-11 07:20:24.212 [rank:3] [train], epoch: 44/50, iter: 100/834, loss: 0.24205, lr: 0.051822, top1: 0.76375, throughput: 311.33 | 2022-04-11 07:20:24.213 [rank:1] [train], epoch: 44/50, iter: 100/834, loss: 0.24119, lr: 0.051822, top1: 0.76714, throughput: 311.29 | 2022-04-11 07:20:24.215 [rank:5] [train], epoch: 44/50, iter: 100/834, loss: 0.24273, lr: 0.051822, top1: 0.76271, throughput: 311.34 | 2022-04-11 07:20:24.232 [rank:4] [train], epoch: 44/50, iter: 100/834, loss: 0.24205, lr: 0.051822, top1: 0.76630, throughput: 311.23 | 2022-04-11 07:20:24.243 [rank:6] [train], epoch: 44/50, iter: 100/834, loss: 0.24405, lr: 0.051822, top1: 0.76021, throughput: 311.31 | 2022-04-11 07:20:24.261 [rank:0] [train], epoch: 44/50, iter: 100/834, loss: 0.23950, lr: 0.051822, top1: 0.77479, throughput: 310.95 | 2022-04-11 07:20:24.276 [rank:5] [train], epoch: 44/50, iter: 200/834, loss: 0.24256, lr: 0.049753, top1: 0.76745, throughput: 313.01 | 2022-04-11 07:21:25.572 [rank:0] [train], epoch: 44/50, iter: 200/834, loss: 0.24072, lr: 0.049753, top1: 0.76854, throughput: 313.06 | 2022-04-11 07:21:25.606 [rank:4] [train], epoch: 44/50, iter: 200/834, loss: 0.24442, lr: 0.049753, top1: 0.76234, throughput: 312.78 | 2022-04-11 07:21:25.628 [rank:3] [train], epoch: 44/50, iter: 200/834, loss: 0.24235, lr: 0.049753, top1: 0.76469, throughput: 312.59 | 2022-04-11 07:21:25.635 [rank:7] [train], epoch: 44/50, iter: 200/834, loss: 0.23952, lr: 0.049753, top1: 0.77151, throughput: 312.52 | 2022-04-11 07:21:25.647 [rank:6] [train], epoch: 44/50, iter: 200/834, loss: 0.24157, lr: 0.049753, top1: 0.76922, throughput: 312.60 | 2022-04-11 07:21:25.682 [rank:1] [train], epoch: 44/50, iter: 200/834, loss: 0.24108, lr: 0.049753, top1: 0.77005, throughput: 312.32 | 2022-04-11 07:21:25.689 [rank:2] [train], epoch: 44/50, iter: 200/834, loss: 0.24080, lr: 0.049753, top1: 0.76630, throughput: 312.35 | 2022-04-11 07:21:25.650 [rank:5] [train], epoch: 44/50, iter: 300/834, loss: 0.24055, lr: 0.047725, top1: 0.77047, throughput: 312.91 | 2022-04-11 07:22:26.931 [rank:4] [train], epoch: 44/50, iter: 300/834, loss: 0.24246, lr: 0.047725, top1: 0.76401, throughput: 313.00 | 2022-04-11 07:22:26.971 [rank:6] [train], epoch: 44/50, iter: 300/834, loss: 0.24058, lr: 0.047725, top1: 0.77010, throughput: 313.21 | 2022-04-11 07:22:26.982 [rank:1] [train], epoch: 44/50, iter: 300/834, loss: 0.24179, lr: 0.047725, top1: 0.76734, throughput: 313.24 | 2022-04-11 07:22:26.984 [rank:0] [train], epoch: 44/50, iter: 300/834, loss: 0.24217, lr: 0.047725, top1: 0.76599, throughput: 312.81 | 2022-04-11 07:22:26.985 [rank:2] [train], epoch: 44/50, iter: 300/834, loss: 0.24539, lr: 0.047725, top1: 0.75677, throughput: 313.01 | 2022-04-11 07:22:26.990 [rank:7] [train], epoch: 44/50, iter: 300/834, loss: 0.24410, lr: 0.047725, top1: 0.75807, throughput: 312.93 | 2022-04-11 07:22:27.003 [rank:3] [train], epoch: 44/50, iter: 300/834, loss: 0.24254, lr: 0.047725, top1: 0.76385, throughput: 312.82 | 2022-04-11 07:22:27.012 [rank:5] [train], epoch: 44/50, iter: 400/834, loss: 0.24388, lr: 0.045737, top1: 0.76516, throughput: 311.85 | 2022-04-11 07:23:28.499 [rank:4] [train], epoch: 44/50, iter: 400/834, loss: 0.24168, lr: 0.045737, top1: 0.76771, throughput: 311.96 | 2022-04-11 07:23:28.518 [rank:2] [train], epoch: 44/50, iter: 400/834, loss: 0.24208, lr: 0.045737, top1: 0.76490, throughput: 311.95 | 2022-04-11 07:23:28.539 [rank:7] [train], epoch: 44/50, iter: 400/834, loss: 0.24206, lr: 0.045737, top1: 0.76599, throughput: 311.99 | 2022-04-11 07:23:28.543 [rank:6] [train], epoch: 44/50, iter: 400/834, loss: 0.24108, lr: 0.045737, top1: 0.77042, throughput: 311.82 | 2022-04-11 07:23:28.556 [rank:0] [train], epoch: 44/50, iter: 400/834, loss: 0.24180, lr: 0.045737, top1: 0.76552, throughput: 311.75 | 2022-04-11 07:23:28.572 [rank:3] [train], epoch: 44/50, iter: 400/834, loss: 0.24092, lr: 0.045737, top1: 0.76688, throughput: 311.82 | 2022-04-11 07:23:28.586 [rank:1] [train], epoch: 44/50, iter: 400/834, loss: 0.24301, lr: 0.045737, top1: 0.76568, throughput: 311.67 | 2022-04-11 07:23:28.587 [rank:2] [train], epoch: 44/50, iter: 500/834, loss: 0.24334, lr: 0.043791, top1: 0.76391, throughput: 313.39 | 2022-04-11 07:24:29.805 [rank:5] [train], epoch: 44/50, iter: 500/834, loss: 0.24344, lr: 0.043791, top1: 0.76724, throughput: 313.09 | 2022-04-11 07:24:29.824 [rank:3] [train], epoch: 44/50, iter: 500/834, loss: 0.24329, lr: 0.043791, top1: 0.76370, throughput: 313.47 | 2022-04-11 07:24:29.836 [rank:0] [train], epoch: 44/50, iter: 500/834, loss: 0.24167, lr: 0.043791, top1: 0.76755, throughput: 313.36 | 2022-04-11 07:24:29.844 [rank:6] [train], epoch: 44/50, iter: 500/834, loss: 0.24141, lr: 0.043791, top1: 0.76479, throughput: 313.25 | 2022-04-11 07:24:29.849 [rank:4] [train], epoch: 44/50, iter: 500/834, loss: 0.24481, lr: 0.043791, top1: 0.75812, throughput: 313.05 | 2022-04-11 07:24:29.850 [rank:7] [train], epoch: 44/50, iter: 500/834, loss: 0.24390, lr: 0.043791, top1: 0.76458, throughput: 313.47 | 2022-04-11 07:24:29.793 [rank:1] [train], epoch: 44/50, iter: 500/834, loss: 0.24347, lr: 0.043791, top1: 0.76781, throughput: 313.61 | 2022-04-11 07:24:29.811 [rank:6] [train], epoch: 44/50, iter: 600/834, loss: 0.24223, lr: 0.041886, top1: 0.76557, throughput: 314.07 | 2022-04-11 07:25:30.983 [rank:4] [train], epoch: 44/50, iter: 600/834, loss: 0.24413, lr: 0.041886, top1: 0.75958, throughput: 313.93 | 2022-04-11 07:25:31.010 [rank:5] [train], epoch: 44/50, iter: 600/834, loss: 0.24193, lr: 0.041886, top1: 0.76422, throughput: 313.71 | 2022-04-11 07:25:31.027 [rank:0] [train], epoch: 44/50, iter: 600/834, loss: 0.24323, lr: 0.041886, top1: 0.76792, throughput: 313.67 | 2022-04-11 07:25:31.056 [rank:7] [train], epoch: 44/50, iter: 600/834, loss: 0.24272, lr: 0.041886, top1: 0.76932, throughput: 313.40 | 2022-04-11 07:25:31.056 [rank:2] [train], epoch: 44/50, iter: 600/834, loss: 0.24085, lr: 0.041886, top1: 0.76677, throughput: 313.46 | 2022-04-11 07:25:31.057 [rank:3] [train], epoch: 44/50, iter: 600/834, loss: 0.24078, lr: 0.041886, top1: 0.76974, throughput: 313.61 | 2022-04-11 07:25:31.058 [rank:1] [train], epoch: 44/50, iter: 600/834, loss: 0.24206, lr: 0.041886, top1: 0.76625, throughput: 313.28 | 2022-04-11 07:25:31.098 [rank:4] [train], epoch: 44/50, iter: 700/834, loss: 0.24292, lr: 0.040022, top1: 0.76740, throughput: 313.44 | 2022-04-11 07:26:32.266 [rank:6] [train], epoch: 44/50, iter: 700/834, loss: 0.24350, lr: 0.040022, top1: 0.76443, throughput: 313.14 | 2022-04-11 07:26:32.297 [rank:2] [train], epoch: 44/50, iter: 700/834, loss: 0.24354, lr: 0.040022, top1: 0.76641, throughput: 313.40 | 2022-04-11 07:26:32.320 [rank:3] [train], epoch: 44/50, iter: 700/834, loss: 0.24299, lr: 0.040022, top1: 0.76495, throughput: 313.40 | 2022-04-11 07:26:32.322 [rank:5] [train], epoch: 44/50, iter: 700/834, loss: 0.24210, lr: 0.040022, top1: 0.76698, throughput: 313.16 | 2022-04-11 07:26:32.338 [rank:7] [train], epoch: 44/50, iter: 700/834, loss: 0.24253, lr: 0.040022, top1: 0.76698, throughput: 313.24 | 2022-04-11 07:26:32.350 [rank:0] [train], epoch: 44/50, iter: 700/834, loss: 0.24094, lr: 0.040022, top1: 0.77109, throughput: 313.24 | 2022-04-11 07:26:32.351 [rank:1] [train], epoch: 44/50, iter: 700/834, loss: 0.24217, lr: 0.040022, top1: 0.76411, throughput: 313.44 | 2022-04-11 07:26:32.353 [rank:4] [train], epoch: 44/50, iter: 800/834, loss: 0.24053, lr: 0.038199, top1: 0.77021, throughput: 312.83 | 2022-04-11 07:27:33.642 [rank:1] [train], epoch: 44/50, iter: 800/834, loss: 0.24215, lr: 0.038199, top1: 0.76604, throughput: 313.01 | 2022-04-11 07:27:33.692 [rank:6] [train], epoch: 44/50, iter: 800/834, loss: 0.24101, lr: 0.038199, top1: 0.76812, throughput: 312.72 | 2022-04-11 07:27:33.694 [rank:7] [train], epoch: 44/50, iter: 800/834, loss: 0.24198, lr: 0.038199, top1: 0.76615, throughput: 312.87 | 2022-04-11 07:27:33.717 [rank:0] [train], epoch: 44/50, iter: 800/834, loss: 0.24136, lr: 0.038199, top1: 0.77104, throughput: 312.84 | 2022-04-11 07:27:33.724 [rank:2] [train], epoch: 44/50, iter: 800/834, loss: 0.24016, lr: 0.038199, top1: 0.76958, throughput: 312.66 | 2022-04-11 07:27:33.728 [rank:3] [train], epoch: 44/50, iter: 800/834, loss: 0.24100, lr: 0.038199, top1: 0.76625, throughput: 312.65 | 2022-04-11 07:27:33.732 [rank:5] [train], epoch: 44/50, iter: 800/834, loss: 0.24157, lr: 0.038199, top1: 0.76672, throughput: 312.39 | 2022-04-11 07:27:33.799 [rank:6] [train], epoch: 44/50, iter: 834/834, loss: 0.24191, lr: 0.037589, top1: 0.76685, throughput: 311.84 | 2022-04-11 07:27:54.628 [rank:2] [train], epoch: 44/50, iter: 834/834, loss: 0.24116, lr: 0.037589, top1: 0.76578, throughput: 312.17 | 2022-04-11 07:27:54.640 [rank:7] [train], epoch: 44/50, iter: 834/834, loss: 0.23700, lr: 0.037589, top1: 0.77865, throughput: 311.95 | 2022-04-11 07:27:54.643 [rank:3] [train], epoch: 44/50, iter: 834/834, loss: 0.24413, lr: 0.037589, top1: 0.75643, throughput: 312.06 | 2022-04-11 07:27:54.651 [rank:4] [train], epoch: 44/50, iter: 834/834, loss: 0.24161, lr: 0.037589, top1: 0.76731, throughput: 310.46 | 2022-04-11 07:27:54.669 [rank:0] [train], epoch: 44/50, iter: 834/834, loss: 0.24056, lr: 0.037589, top1: 0.76808, throughput: 311.66 | 2022-04-11 07:27:54.670 [rank:5] [train], epoch: 44/50, iter: 834/834, loss: 0.24130, lr: 0.037589, top1: 0.76057, throughput: 312.58 | 2022-04-11 07:27:54.684 [rank:1] [train], epoch: 44/50, iter: 834/834, loss: 0.24234, lr: 0.037589, top1: 0.76854, throughput: 310.89 | 2022-04-11 07:27:54.690 [rank:0] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.75280, throughput: 485.35 | 2022-04-11 07:28:07.547 [rank:2] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.74544, throughput: 483.71 | 2022-04-11 07:28:07.561 [rank:1] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.75792, throughput: 485.42 | 2022-04-11 07:28:07.565 [rank:5] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.75072, throughput: 485.11 | 2022-04-11 07:28:07.567 [rank:4] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.74832, throughput: 484.51 | 2022-04-11 07:28:07.568 [rank:7] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.76352, throughput: 483.29 | 2022-04-11 07:28:07.576 [rank:3] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.75376, throughput: 483.54 | 2022-04-11 07:28:07.576 [rank:6] [eval], epoch: 44/50, iter: 125/125, loss: 0.00000, lr: 0.037589, top1: 0.75872, throughput: 480.99 | 2022-04-11 07:28:07.622 [rank:3] [train], epoch: 45/50, iter: 100/834, loss: 0.24036, lr: 0.035821, top1: 0.77068, throughput: 314.44 | 2022-04-11 07:29:08.636 [rank:1] [train], epoch: 45/50, iter: 100/834, loss: 0.23795, lr: 0.035821, top1: 0.77552, throughput: 314.32 | 2022-04-11 07:29:08.649 [rank:2] [train], epoch: 45/50, iter: 100/834, loss: 0.23825, lr: 0.035821, top1: 0.77313, throughput: 314.27 | 2022-04-11 07:29:08.654 [rank:0] [train], epoch: 45/50, iter: 100/834, loss: 0.23842, lr: 0.035821, top1: 0.77750, throughput: 314.14 | 2022-04-11 07:29:08.667 [rank:4] [train], epoch: 45/50, iter: 100/834, loss: 0.24036, lr: 0.035821, top1: 0.77354, throughput: 314.19 | 2022-04-11 07:29:08.677 [rank:5] [train], epoch: 45/50, iter: 100/834, loss: 0.23896, lr: 0.035821, top1: 0.77469, throughput: 314.15 | 2022-04-11 07:29:08.684 [rank:6] [train], epoch: 45/50, iter: 100/834, loss: 0.24068, lr: 0.035821, top1: 0.77021, throughput: 314.41 | 2022-04-11 07:29:08.688 [rank:7] [train], epoch: 45/50, iter: 100/834, loss: 0.23813, lr: 0.035821, top1: 0.77437, throughput: 314.13 | 2022-04-11 07:29:08.697 [rank:4] [train], epoch: 45/50, iter: 200/834, loss: 0.24157, lr: 0.034096, top1: 0.76948, throughput: 311.39 | 2022-04-11 07:30:10.337 [rank:3] [train], epoch: 45/50, iter: 200/834, loss: 0.23959, lr: 0.034096, top1: 0.76938, throughput: 311.10 | 2022-04-11 07:30:10.352 [rank:7] [train], epoch: 45/50, iter: 200/834, loss: 0.23652, lr: 0.034096, top1: 0.77526, throughput: 311.40 | 2022-04-11 07:30:10.354 [rank:6] [train], epoch: 45/50, iter: 200/834, loss: 0.23852, lr: 0.034096, top1: 0.77823, throughput: 311.27 | 2022-04-11 07:30:10.370 [rank:5] [train], epoch: 45/50, iter: 200/834, loss: 0.24024, lr: 0.034096, top1: 0.77286, throughput: 311.21 | 2022-04-11 07:30:10.379 [rank:0] [train], epoch: 45/50, iter: 200/834, loss: 0.23988, lr: 0.034096, top1: 0.77271, throughput: 311.05 | 2022-04-11 07:30:10.394 [rank:1] [train], epoch: 45/50, iter: 200/834, loss: 0.23910, lr: 0.034096, top1: 0.77385, throughput: 311.27 | 2022-04-11 07:30:10.331 [rank:2] [train], epoch: 45/50, iter: 200/834, loss: 0.23919, lr: 0.034096, top1: 0.77443, throughput: 310.80 | 2022-04-11 07:30:10.431 [rank:7] [train], epoch: 45/50, iter: 300/834, loss: 0.23717, lr: 0.032412, top1: 0.77490, throughput: 314.18 | 2022-04-11 07:31:11.467 [rank:0] [train], epoch: 45/50, iter: 300/834, loss: 0.23919, lr: 0.032412, top1: 0.77245, throughput: 314.37 | 2022-04-11 07:31:11.468 [rank:5] [train], epoch: 45/50, iter: 300/834, loss: 0.24035, lr: 0.032412, top1: 0.76635, throughput: 314.25 | 2022-04-11 07:31:11.477 [rank:6] [train], epoch: 45/50, iter: 300/834, loss: 0.23753, lr: 0.032412, top1: 0.77323, throughput: 314.16 | 2022-04-11 07:31:11.485 [rank:4] [train], epoch: 45/50, iter: 300/834, loss: 0.23746, lr: 0.032412, top1: 0.77474, throughput: 313.88 | 2022-04-11 07:31:11.508 [rank:2] [train], epoch: 45/50, iter: 300/834, loss: 0.23850, lr: 0.032412, top1: 0.77250, throughput: 314.32 | 2022-04-11 07:31:11.516 [rank:3] [train], epoch: 45/50, iter: 300/834, loss: 0.24080, lr: 0.032412, top1: 0.76792, throughput: 313.90 | 2022-04-11 07:31:11.517 [rank:1] [train], epoch: 45/50, iter: 300/834, loss: 0.24007, lr: 0.032412, top1: 0.77198, throughput: 313.76 | 2022-04-11 07:31:11.525 [rank:0] [train], epoch: 45/50, iter: 400/834, loss: 0.23940, lr: 0.030769, top1: 0.77422, throughput: 313.72 | 2022-04-11 07:32:12.668 [rank:2] [train], epoch: 45/50, iter: 400/834, loss: 0.23936, lr: 0.030769, top1: 0.77323, throughput: 314.19[rank:6] [train], epoch: 45/50, iter: 400/834, loss: 0.24102, lr: 0.030769, top1: 0.76792, throughput: 313.61 | 2022-04-11 07:32:12.625| 2022-04-11 07:32:12.708 [rank:1] [train], epoch: 45/50, iter: 400/834, loss: 0.23788, lr: 0.030769, top1: 0.77401, throughput: 313.79 | 2022-04-11 07:32:12.712 [rank:5] [train], epoch: 45/50, iter: 400/834, loss: 0.23878, lr: 0.030769, top1: 0.77484, throughput: 313.39 | 2022-04-11 07:32:12.742 [rank:7] [train], epoch: 45/50, iter: 400/834, loss: 0.23839, lr: 0.030769, top1: 0.77437, throughput: 313.33 | 2022-04-11 07:32:12.744 [rank:4] [train], epoch: 45/50, iter: 400/834, loss: 0.23968, lr: 0.030769, top1: 0.77339, throughput: 313.49 | 2022-04-11 07:32:12.754 [rank:3] [train], epoch: 45/50, iter: 400/834, loss: 0.24079, lr: 0.030769, top1: 0.76682, throughput: 313.50 | 2022-04-11 07:32:12.761 [rank:6] [train], epoch: 45/50, iter: 500/834, loss: 0.23882, lr: 0.029169, top1: 0.77271, throughput: 312.02 | 2022-04-11 07:33:14.243 [rank:4] [train], epoch: 45/50, iter: 500/834, loss: 0.23906, lr: 0.029169, top1: 0.77422, throughput: 312.21 | 2022-04-11 07:33:14.250 [rank:7] [train], epoch: 45/50, iter: 500/834, loss: 0.24095, lr: 0.029169, top1: 0.76823, throughput: 312.13 | 2022-04-11 07:33:14.257 [rank:2] [train], epoch: 45/50, iter: 500/834, loss: 0.24026, lr: 0.029169, top1: 0.77005, throughput: 311.46 | 2022-04-11 07:33:14.271 [rank:5] [train], epoch: 45/50, iter: 500/834, loss: 0.23928, lr: 0.029169, top1: 0.77042, throughput: 312.02 | 2022-04-11 07:33:14.276 [rank:1] [train], epoch: 45/50, iter: 500/834, loss: 0.24050, lr: 0.029169, top1: 0.77135, throughput: 311.74 | 2022-04-11 07:33:14.303 [rank:3] [train], epoch: 45/50, iter: 500/834, loss: 0.23988, lr: 0.029169, top1: 0.77036, throughput: 311.93 | 2022-04-11 07:33:14.314 [rank:0] [train], epoch: 45/50, iter: 500/834, loss: 0.23954, lr: 0.029169, top1: 0.77010, throughput: 311.87 | 2022-04-11 07:33:14.233 [rank:4] [train], epoch: 45/50, iter: 600/834, loss: 0.23763, lr: 0.027611, top1: 0.77589, throughput: 312.97 | 2022-04-11 07:34:15.597 [rank:7] [train], epoch: 45/50, iter: 600/834, loss: 0.24002, lr: 0.027611, top1: 0.76927, throughput: 312.97 | 2022-04-11 07:34:15.605 [rank:1] [train], epoch: 45/50, iter: 600/834, loss: 0.23987, lr: 0.027611, top1: 0.76917, throughput: 313.18 | 2022-04-11 07:34:15.609 [rank:5] [train], epoch: 45/50, iter: 600/834, loss: 0.23783, lr: 0.027611, top1: 0.77453, throughput: 313.02 | 2022-04-11 07:34:15.614 [rank:2] [train], epoch: 45/50, iter: 600/834, loss: 0.23881, lr: 0.027611, top1: 0.77151, throughput: 312.88 | 2022-04-11 07:34:15.635 [rank:0] [train], epoch: 45/50, iter: 600/834, loss: 0.23800, lr: 0.027611, top1: 0.77568, throughput: 312.56 | 2022-04-11 07:34:15.662 [rank:3] [train], epoch: 45/50, iter: 600/834, loss: 0.23909, lr: 0.027611, top1: 0.77255, throughput: 312.97 | 2022-04-11 07:34:15.662 [rank:6] [train], epoch: 45/50, iter: 600/834, loss: 0.23798, lr: 0.027611, top1: 0.77698, throughput: 312.57 | 2022-04-11 07:34:15.669 [rank:4] [train], epoch: 45/50, iter: 700/834, loss: 0.23826, lr: 0.026094, top1: 0.77344, throughput: 313.52 | 2022-04-11 07:35:16.838 [rank:0] [train], epoch: 45/50, iter: 700/834, loss: 0.23946, lr: 0.026094, top1: 0.76906, throughput: 313.70 | 2022-04-11 07:35:16.866 [rank:1] [train], epoch: 45/50, iter: 700/834, loss: 0.23981, lr: 0.026094, top1: 0.77026, throughput: 313.39 | 2022-04-11 07:35:16.875 [rank:5] [train], epoch: 45/50, iter: 700/834, loss: 0.23816, lr: 0.026094, top1: 0.77516, throughput: 313.37 | 2022-04-11 07:35:16.884 [rank:2] [train], epoch: 45/50, iter: 700/834, loss: 0.23817, lr: 0.026094, top1: 0.77380, throughput: 313.41 | 2022-04-11 07:35:16.898 [rank:6] [train], epoch: 45/50, iter: 700/834, loss: 0.23985, lr: 0.026094, top1: 0.76943, throughput: 313.57 | 2022-04-11 07:35:16.899 [rank:3] [train], epoch: 45/50, iter: 700/834, loss: 0.24101, lr: 0.026094, top1: 0.77151, throughput: 313.53 | 2022-04-11 07:35:16.899 [rank:7] [train], epoch: 45/50, iter: 700/834, loss: 0.23908, lr: 0.026094, top1: 0.77344, throughput: 313.48 | 2022-04-11 07:35:16.853 [rank:4] [train], epoch: 45/50, iter: 800/834, loss: 0.23803, lr: 0.024620, top1: 0.77677, throughput: 313.30 | 2022-04-11 07:36:18.121 [rank:5] [train], epoch: 45/50, iter: 800/834, loss: 0.23945, lr: 0.024620, top1: 0.77406, throughput: 313.52 | 2022-04-11 07:36:18.125 [rank:0] [train], epoch: 45/50, iter: 800/834, loss: 0.23899, lr: 0.024620, top1: 0.77557, throughput: 313.33 | 2022-04-11 07:36:18.143 [rank:1] [train], epoch: 45/50, iter: 800/834, loss: 0.24007, lr: 0.024620, top1: 0.76859, throughput: 313.35 | 2022-04-11 07:36:18.149 [rank:2] [train], epoch: 45/50, iter: 800/834, loss: 0.23793, lr: 0.024620, top1: 0.77625, throughput: 313.41 | 2022-04-11 07:36:18.159 [rank:6] [train], epoch: 45/50, iter: 800/834, loss: 0.23891, lr: 0.024620, top1: 0.77302, throughput: 313.37 | 2022-04-11 07:36:18.168 [rank:7] [train], epoch: 45/50, iter: 800/834, loss: 0.23953, lr: 0.024620, top1: 0.77214, throughput: 313.12 | 2022-04-11 07:36:18.171 [rank:3] [train], epoch: 45/50, iter: 800/834, loss: 0.23881, lr: 0.024620, top1: 0.77401, throughput: 313.31 | 2022-04-11 07:36:18.180 [rank:4] [train], epoch: 45/50, iter: 834/834, loss: 0.23941, lr: 0.024128, top1: 0.76915, throughput: 311.64 | 2022-04-11 07:36:39.068 [rank:5] [train], epoch: 45/50, iter: 834/834, loss: 0.23901, lr: 0.024128, top1: 0.77528, throughput: 311.62 | 2022-04-11 07:36:39.073 [rank:6] [train], epoch: 45/50, iter: 834/834, loss: 0.24152, lr: 0.024128, top1: 0.76915, throughput: 312.25 | 2022-04-11 07:36:39.074 [rank:2] [train], epoch: 45/50, iter: 834/834, loss: 0.24282, lr: 0.024128, top1: 0.76685, throughput: 312.10 | 2022-04-11 07:36:39.075 [rank:0] [train], epoch: 45/50, iter: 834/834, loss: 0.24051, lr: 0.024128, top1: 0.77099, throughput: 311.85 | 2022-04-11 07:36:39.076 [rank:7] [train], epoch: 45/50, iter: 834/834, loss: 0.23839, lr: 0.024128, top1: 0.77313, throughput: 312.17 | 2022-04-11 07:36:39.083 [rank:1] [train], epoch: 45/50, iter: 834/834, loss: 0.23803, lr: 0.024128, top1: 0.77436, throughput: 311.20 | 2022-04-11 07:36:39.125 [rank:3] [train], epoch: 45/50, iter: 834/834, loss: 0.23674, lr: 0.024128, top1: 0.77206, throughput: 311.57 | 2022-04-11 07:36:39.132 [rank:0] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.76048, throughput: 490.73 | 2022-04-11 07:36:51.812 [rank:3] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.75456, throughput: 492.49 | 2022-04-11 07:36:51.823 [rank:2] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.74992, throughput: 490.26 | 2022-04-11 07:36:51.824 [rank:4] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.75312, throughput: 489.70 | 2022-04-11 07:36:51.831 [rank:7] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.76624, throughput: 490.04 | 2022-04-11 07:36:51.837 [rank:5] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.74928, throughput: 489.31 | 2022-04-11 07:36:51.847 [rank:1] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.76160, throughput: 490.90 | 2022-04-11 07:36:51.857 [rank:6] [eval], epoch: 45/50, iter: 125/125, loss: 0.00000, lr: 0.024128, top1: 0.76384, throughput: 488.32 | 2022-04-11 07:36:51.873 [rank:1] [train], epoch: 46/50, iter: 100/834, loss: 0.23756, lr: 0.022710, top1: 0.77370, throughput: 313.64 | 2022-04-11 07:37:53.074 [rank:0] [train], epoch: 46/50, iter: 100/834, loss: 0.23487, lr: 0.022710, top1: 0.78422, throughput: 313.68 | 2022-04-11 07:37:53.020 [rank:5] [train], epoch: 46/50, iter: 100/834, loss: 0.23613, lr: 0.022710, top1: 0.78146, throughput: 313.43 | 2022-04-11 07:37:53.104 [rank:6] [train], epoch: 46/50, iter: 100/834, loss: 0.23753, lr: 0.022710, top1: 0.77625, throughput: 313.53 | 2022-04-11 07:37:53.112 [rank:3] [train], epoch: 46/50, iter: 100/834, loss: 0.23568, lr: 0.022710, top1: 0.78130, throughput: 313.27 | 2022-04-11 07:37:53.112 [rank:7] [train], epoch: 46/50, iter: 100/834, loss: 0.23431, lr: 0.022710, top1: 0.78688, throughput: 313.30 | 2022-04-11 07:37:53.120 [rank:4] [train], epoch: 46/50, iter: 100/834, loss: 0.23612, lr: 0.022710, top1: 0.77922, throughput: 313.25 | 2022-04-11 07:37:53.125 [rank:2] [train], epoch: 46/50, iter: 100/834, loss: 0.23725, lr: 0.022710, top1: 0.77760, throughput: 313.57 | 2022-04-11 07:37:53.054 [rank:4] [train], epoch: 46/50, iter: 200/834, loss: 0.23554, lr: 0.021335, top1: 0.78078, throughput: 313.44 | 2022-04-11 07:38:54.381 [rank:5] [train], epoch: 46/50, iter: 200/834, loss: 0.23663, lr: 0.021335, top1: 0.77688, throughput: 313.19 | 2022-04-11 07:38:54.409 [rank:2] [train], epoch: 46/50, iter: 200/834, loss: 0.23570, lr: 0.021335, top1: 0.78224, throughput: 312.81 | 2022-04-11 07:38:54.433 [rank:1] [train], epoch: 46/50, iter: 200/834, loss: 0.23704, lr: 0.021335, top1: 0.77964, throughput: 312.84 | 2022-04-11 07:38:54.448 [rank:0] [train], epoch: 46/50, iter: 200/834, loss: 0.23597, lr: 0.021335, top1: 0.77719, throughput: 312.56 | 2022-04-11 07:38:54.449 [rank:6] [train], epoch: 46/50, iter: 200/834, loss: 0.23594, lr: 0.021335, top1: 0.78167, throughput: 313.01 | 2022-04-11 07:38:54.452 [rank:3] [train], epoch: 46/50, iter: 200/834, loss: 0.23575, lr: 0.021335, top1: 0.78047, throughput: 312.93 | 2022-04-11 07:38:54.468 [rank:7] [train], epoch: 46/50, iter: 200/834, loss: 0.23636, lr: 0.021335, top1: 0.77531, throughput: 312.89 | 2022-04-11 07:38:54.483 [rank:5] [train], epoch: 46/50, iter: 300/834, loss: 0.23564, lr: 0.020002, top1: 0.77672, throughput: 313.71 | 2022-04-11 07:39:55.613 [rank:6] [train], epoch: 46/50, iter: 300/834, loss: 0.23758, lr: 0.020002, top1: 0.77776, throughput: 313.90 | 2022-04-11 07:39:55.617 [rank:0] [train], epoch: 46/50, iter: 300/834, loss: 0.23532, lr: 0.020002, top1: 0.78302, throughput: 313.82 | 2022-04-11 07:39:55.631 [rank:2] [train], epoch: 46/50, iter: 300/834, loss: 0.23631, lr: 0.020002, top1: 0.78042, throughput: 313.62 | 2022-04-11 07:39:55.653 [rank:3] [train], epoch: 46/50, iter: 300/834, loss: 0.23617, lr: 0.020002, top1: 0.78052, throughput: 313.69 | 2022-04-11 07:39:55.676 [rank:4] [train], epoch: 46/50, iter: 300/834, loss: 0.23815, lr: 0.020002, top1: 0.77729, throughput: 313.19 | 2022-04-11 07:39:55.685 [rank:7] [train], epoch: 46/50, iter: 300/834, loss: 0.23494, lr: 0.020002, top1: 0.78177, throughput: 314.09 | 2022-04-11 07:39:55.612 [rank:1] [train], epoch: 46/50, iter: 300/834, loss: 0.23552, lr: 0.020002, top1: 0.77859, throughput: 313.85 | 2022-04-11 07:39:55.623 [rank:6] [train], epoch: 46/50, iter: 400/834, loss: 0.23769, lr: 0.018711, top1: 0.77620, throughput: 313.29 | 2022-04-11 07:40:56.902 [rank:7] [train], epoch: 46/50, iter: 400/834, loss: 0.23780, lr: 0.018711, top1: 0.77370, throughput: 313.10 | 2022-04-11 07:40:56.935 [rank:3] [train], epoch: 46/50, iter: 400/834, loss: 0.23613, lr: 0.018711, top1: 0.77917, throughput: 313.39 | 2022-04-11 07:40:56.940 [rank:4] [train], epoch: 46/50, iter: 400/834, loss: 0.23552, lr: 0.018711, top1: 0.77833, throughput: 313.44 | 2022-04-11 07:40:56.941 [rank:2] [train], epoch: 46/50, iter: 400/834, loss: 0.23752, lr: 0.018711, top1: 0.77646, throughput: 313.09 | 2022-04-11 07:40:56.979 [rank:5] [train], epoch: 46/50, iter: 400/834, loss: 0.23660, lr: 0.018711, top1: 0.77526, throughput: 313.30 | 2022-04-11 07:40:56.896 [rank:1] [train], epoch: 46/50, iter: 400/834, loss: 0.23611, lr: 0.018711, top1: 0.78120, throughput: 312.84 | 2022-04-11 07:40:56.997 [rank:0] [train], epoch: 46/50, iter: 400/834, loss: 0.23592, lr: 0.018711, top1: 0.78375, throughput: 312.83 | 2022-04-11 07:40:57.007 [rank:5] [train], epoch: 46/50, iter: 500/834, loss: 0.23488, lr: 0.017463, top1: 0.77948, throughput: 312.83 | 2022-04-11 07:41:58.271 [rank:0] [train], epoch: 46/50, iter: 500/834, loss: 0.23378, lr: 0.017463, top1: 0.78245, throughput: 313.39 | 2022-04-11 07:41:58.273 [rank:4] [train], epoch: 46/50, iter: 500/834, loss: 0.23554, lr: 0.017463, top1: 0.77849, throughput: 312.95 | 2022-04-11 07:41:58.293 [rank:7] [train], epoch: 46/50, iter: 500/834, loss: 0.23502, lr: 0.017463, top1: 0.78182, throughput: 312.81 | 2022-04-11 07:41:58.313 [rank:6] [train], epoch: 46/50, iter: 500/834, loss: 0.23557, lr: 0.017463, top1: 0.78240, throughput: 312.63[rank:2] [train], epoch: 46/50, iter: 500/834, loss: 0.23575, lr: 0.017463, top1: 0.78135, throughput: 313.02 | 2022-04-11 07:41:58.317 | 2022-04-11 07:41:58.317 [rank:3] [train], epoch: 46/50, iter: 500/834, loss: 0.23570, lr: 0.017463, top1: 0.77943, throughput: 312.80 | 2022-04-11 07:41:58.321 [rank:1] [train], epoch: 46/50, iter: 500/834, loss: 0.23858, lr: 0.017463, top1: 0.77589, throughput: 312.99 | 2022-04-11 07:41:58.341 [rank:4] [train], epoch: 46/50, iter: 600/834, loss: 0.23519, lr: 0.016257, top1: 0.78172, throughput: 313.74 | 2022-04-11 07:42:59.491 [rank:1] [train], epoch: 46/50, iter: 600/834, loss: 0.23675, lr: 0.016257, top1: 0.77917, throughput: 313.85 | 2022-04-11 07:42:59.517 [rank:7] [train], epoch: 46/50, iter: 600/834, loss: 0.23607, lr: 0.016257, top1: 0.78224, throughput: 313.67 | 2022-04-11 07:42:59.524 [rank:5] [train], epoch: 46/50, iter: 600/834, loss: 0.23634, lr: 0.016257, top1: 0.77865, throughput: 313.45 | 2022-04-11 07:42:59.524 [rank:6] [train], epoch: 46/50, iter: 600/834, loss: 0.23607, lr: 0.016257, top1: 0.78245, throughput: 313.68 | 2022-04-11 07:42:59.526 [rank:2] [train], epoch: 46/50, iter: 600/834, loss: 0.23632, lr: 0.016257, top1: 0.78187, throughput: 313.67 | 2022-04-11 07:42:59.528 [rank:0] [train], epoch: 46/50, iter: 600/834, loss: 0.23482, lr: 0.016257, top1: 0.77969, throughput: 313.30 | 2022-04-11 07:42:59.556 [rank:3] [train], epoch: 46/50, iter: 600/834, loss: 0.23626, lr: 0.016257, top1: 0.77828, throughput: 313.53 | 2022-04-11 07:42:59.559 [rank:4] [train], epoch: 46/50, iter: 700/834, loss: 0.23695, lr: 0.015095, top1: 0.77531, throughput: 312.18 | 2022-04-11 07:44:00.994 [rank:7] [train], epoch: 46/50, iter: 700/834, loss: 0.23679, lr: 0.015095, top1: 0.77536, throughput: 312.18 | 2022-04-11 07:44:01.027 [rank:3] [train], epoch: 46/50, iter: 700/834, loss: 0.23413, lr: 0.015095, top1: 0.78411, throughput: 312.31 | 2022-04-11 07:44:01.037 [rank:5] [train], epoch: 46/50, iter: 700/834, loss: 0.23439, lr: 0.015095, top1: 0.78292, throughput: 312.04 | 2022-04-11 07:44:01.054 [rank:0] [train], epoch: 46/50, iter: 700/834, loss: 0.23571, lr: 0.015095, top1: 0.78156, throughput: 312.15 | 2022-04-11 07:44:01.065 [rank:6] [train], epoch: 46/50, iter: 700/834, loss: 0.23519, lr: 0.015095, top1: 0.78188, throughput: 311.92 | 2022-04-11 07:44:01.080 [rank:1] [train], epoch: 46/50, iter: 700/834, loss: 0.23775, lr: 0.015095, top1: 0.77583, throughput: 311.85 | 2022-04-11 07:44:01.084 [rank:2] [train], epoch: 46/50, iter: 700/834, loss: 0.23542, lr: 0.015095, top1: 0.78031, throughput: 311.86 | 2022-04-11 07:44:01.094 [rank:1] [train], epoch: 46/50, iter: 800/834, loss: 0.23482, lr: 0.013974, top1: 0.78344, throughput: 313.99 | 2022-04-11 07:45:02.234 [rank:6] [train], epoch: 46/50, iter: 800/834, loss: 0.23516, lr: 0.013974, top1: 0.78089, throughput: 313.85 | 2022-04-11 07:45:02.255 [rank:2] [train], epoch: 46/50, iter: 800/834, loss: 0.23682, lr: 0.013974, top1: 0.77906, throughput: 313.86 | 2022-04-11 07:45:02.267 [rank:5] [train], epoch: 46/50, iter: 800/834, loss: 0.23641, lr: 0.013974, top1: 0.77708, throughput: 313.66 | 2022-04-11 07:45:02.267 [rank:0] [train], epoch: 46/50, iter: 800/834, loss: 0.23475, lr: 0.013974, top1: 0.77995, throughput: 313.66 | 2022-04-11 07:45:02.277 [rank:4] [train], epoch: 46/50, iter: 800/834, loss: 0.23545, lr: 0.013974, top1: 0.78161, throughput: 313.30 | 2022-04-11 07:45:02.278 [rank:7] [train], epoch: 46/50, iter: 800/834, loss: 0.23652, lr: 0.013974, top1: 0.77776, throughput: 313.42 | 2022-04-11 07:45:02.286 [rank:3] [train], epoch: 46/50, iter: 800/834, loss: 0.23539, lr: 0.013974, top1: 0.78000, throughput: 313.83 | 2022-04-11 07:45:02.217 [rank:4] [train], epoch: 46/50, iter: 834/834, loss: 0.23958, lr: 0.013603, top1: 0.77114, throughput: 312.77 | 2022-04-11 07:45:23.150 [rank:2] [train], epoch: 46/50, iter: 834/834, loss: 0.23435, lr: 0.013603, top1: 0.78431, throughput: 312.59 | 2022-04-11 07:45:23.151 [rank:0] [train], epoch: 46/50, iter: 834/834, loss: 0.23533, lr: 0.013603, top1: 0.77926, throughput: 312.74 | 2022-04-11 07:45:23.151 [rank:3] [train], epoch: 46/50, iter: 834/834, loss: 0.23612, lr: 0.013603, top1: 0.78171, throughput: 311.73 | 2022-04-11 07:45:23.158 [rank:5] [train], epoch: 46/50, iter: 834/834, loss: 0.23265, lr: 0.013603, top1: 0.78293, throughput: 312.47 | 2022-04-11 07:45:23.159 [rank:1] [train], epoch: 46/50, iter: 834/834, loss: 0.23998, lr: 0.013603, top1: 0.76654, throughput: 311.84 | 2022-04-11 07:45:23.167 [rank:7] [train], epoch: 46/50, iter: 834/834, loss: 0.23337, lr: 0.013603, top1: 0.78232, throughput: 312.35 | 2022-04-11 07:45:23.186 [rank:6] [train], epoch: 46/50, iter: 834/834, loss: 0.23768, lr: 0.013603, top1: 0.76808, throughput: 311.72 | 2022-04-11 07:45:23.197 [rank:0] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.76320, throughput: 490.31 | 2022-04-11 07:45:35.898 [rank:1] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.76672, throughput: 490.54 | 2022-04-11 07:45:35.908 [rank:2] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.75184, throughput: 489.91 | 2022-04-11 07:45:35.908 [rank:3] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.75888, throughput: 489.93 | 2022-04-11 07:45:35.915 [rank:5] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.75696, throughput: 489.68 | 2022-04-11 07:45:35.922 [rank:4] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.75680, throughput: 489.28 | 2022-04-11 07:45:35.923 [rank:7] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.76336, throughput: 490.25 | 2022-04-11 07:45:35.934 [rank:6] [eval], epoch: 46/50, iter: 125/125, loss: 0.00000, lr: 0.013603, top1: 0.76560, throughput: 489.76 | 2022-04-11 07:45:35.958 [rank:4] [train], epoch: 47/50, iter: 100/834, loss: 0.23592, lr: 0.012541, top1: 0.77885, throughput: 312.66 | 2022-04-11 07:46:37.331 [rank:1] [train], epoch: 47/50, iter: 100/834, loss: 0.23301, lr: 0.012541, top1: 0.78974, throughput: 312.49 | 2022-04-11 07:46:37.351 [rank:7] [train], epoch: 47/50, iter: 100/834, loss: 0.23437, lr: 0.012541, top1: 0.78089, throughput: 312.58 | 2022-04-11 07:46:37.358 [rank:6] [train], epoch: 47/50, iter: 100/834, loss: 0.23510, lr: 0.012541, top1: 0.78297, throughput: 312.69 | 2022-04-11 07:46:37.360 [rank:2] [train], epoch: 47/50, iter: 100/834, loss: 0.23557, lr: 0.012541, top1: 0.77802, throughput: 312.41 | 2022-04-11 07:46:37.367 [rank:0] [train], epoch: 47/50, iter: 100/834, loss: 0.23486, lr: 0.012541, top1: 0.78547, throughput: 312.26 | 2022-04-11 07:46:37.385 [rank:3] [train], epoch: 47/50, iter: 100/834, loss: 0.23542, lr: 0.012541, top1: 0.78062, throughput: 312.34 | 2022-04-11 07:46:37.386 [rank:5] [train], epoch: 47/50, iter: 100/834, loss: 0.23308, lr: 0.012541, top1: 0.78672, throughput: 312.35 | 2022-04-11 07:46:37.392 [rank:4] [train], epoch: 47/50, iter: 200/834, loss: 0.23495, lr: 0.011521, top1: 0.78297, throughput: 312.26 | 2022-04-11 07:47:38.819 [rank:2] [train], epoch: 47/50, iter: 200/834, loss: 0.23508, lr: 0.011521, top1: 0.78484, throughput: 312.43 | 2022-04-11 07:47:38.821 [rank:5] [train], epoch: 47/50, iter: 200/834, loss: 0.23448, lr: 0.011521, top1: 0.78391, throughput: 312.53 | 2022-04-11 07:47:38.826 [rank:0] [train], epoch: 47/50, iter: 200/834, loss: 0.23373, lr: 0.011521, top1: 0.78661, throughput: 312.49 | 2022-04-11 07:47:38.826 [rank:1] [train], epoch: 47/50, iter: 200/834, loss: 0.23296, lr: 0.011521, top1: 0.78766, throughput: 312.31 | 2022-04-11 07:47:38.828 [rank:6] [train], epoch: 47/50, iter: 200/834, loss: 0.23697, lr: 0.011521, top1: 0.77594, throughput: 312.28 | 2022-04-11 07:47:38.842 [rank:7] [train], epoch: 47/50, iter: 200/834, loss: 0.23436, lr: 0.011521, top1: 0.78594, throughput: 312.23 | 2022-04-11 07:47:38.851 [rank:3] [train], epoch: 47/50, iter: 200/834, loss: 0.23457, lr: 0.011521, top1: 0.78349, throughput: 312.32 | 2022-04-11 07:47:38.860 [rank:5] [train], epoch: 47/50, iter: 300/834, loss: 0.23283, lr: 0.010544, top1: 0.78349, throughput: 313.38 | 2022-04-11 07:48:40.093 [rank:2] [train], epoch: 47/50, iter: 300/834, loss: 0.23540, lr: 0.010544, top1: 0.78109, throughput: 313.29 | 2022-04-11 07:48:40.107 [rank:6] [train], epoch: 47/50, iter: 300/834, loss: 0.23550, lr: 0.010544, top1: 0.78036, throughput: 313.34 | 2022-04-11 07:48:40.117 [rank:7] [train], epoch: 47/50, iter: 300/834, loss: 0.23642, lr: 0.010544, top1: 0.78115, throughput: 313.34 | 2022-04-11 07:48:40.127 [rank:3] [train], epoch: 47/50, iter: 300/834, loss: 0.23504, lr: 0.010544, top1: 0.78599, throughput: 313.33 | 2022-04-11 07:48:40.137 [rank:0] [train], epoch: 47/50, iter: 300/834, loss: 0.23345, lr: 0.010544, top1: 0.78286, throughput: 312.99 | 2022-04-11 07:48:40.170 [rank:4] [train], epoch: 47/50, iter: 300/834, loss: 0.23546, lr: 0.010544, top1: 0.78203, throughput: 312.89 | 2022-04-11 07:48:40.182 [rank:1] [train], epoch: 47/50, iter: 300/834, loss: 0.23357, lr: 0.010544, top1: 0.78531, throughput: 312.83 | 2022-04-11 07:48:40.202 [rank:5] [train], epoch: 47/50, iter: 400/834, loss: 0.23374, lr: 0.009610, top1: 0.78427, throughput: 312.11 | 2022-04-11 07:49:41.610 [rank:7] [train], epoch: 47/50, iter: 400/834, loss: 0.23445, lr: 0.009610, top1: 0.78568, throughput: 312.21 | 2022-04-11 07:49:41.625 [rank:3] [train], epoch: 47/50, iter: 400/834, loss: 0.23297, lr: 0.009610, top1: 0.78615, throughput: 312.15 | 2022-04-11 07:49:41.647 [rank:4] [train], epoch: 47/50, iter: 400/834, loss: 0.23689, lr: 0.009610, top1: 0.77797, throughput: 312.27 | 2022-04-11 07:49:41.668 [rank:1] [train], epoch: 47/50, iter: 400/834, loss: 0.23400, lr: 0.009610, top1: 0.78396, throughput: 312.32 | 2022-04-11 07:49:41.678 [rank:6] [train], epoch: 47/50, iter: 400/834, loss: 0.23376, lr: 0.009610, top1: 0.78458, throughput: 311.88 | 2022-04-11 07:49:41.678 [rank:0] [train], epoch: 47/50, iter: 400/834, loss: 0.23323, lr: 0.009610, top1: 0.78510, throughput: 312.07 | 2022-04-11 07:49:41.694 [rank:2] [train], epoch: 47/50, iter: 400/834, loss: 0.23513, lr: 0.009610, top1: 0.78156, throughput: 311.72 | 2022-04-11 07:49:41.700 [rank:6] [train], epoch: 47/50, iter: 500/834, loss: 0.23526, lr: 0.008719, top1: 0.78135, throughput: 313.75 | 2022-04-11 07:50:42.873 [rank:4] [train], epoch: 47/50, iter: 500/834, loss: 0.23179, lr: 0.008719, top1: 0.79120, throughput: 313.65 | 2022-04-11 07:50:42.882 [rank:0] [train], epoch: 47/50, iter: 500/834, loss: 0.23576, lr: 0.008719, top1: 0.78016, throughput: 313.61 | 2022-04-11 07:50:42.918 [rank:5] [train], epoch: 47/50, iter: 500/834, loss: 0.23355, lr: 0.008719, top1: 0.78724, throughput: 313.05 | 2022-04-11 07:50:42.942 [rank:2] [train], epoch: 47/50, iter: 500/834, loss: 0.23117, lr: 0.008719, top1: 0.78875, throughput: 313.46 | 2022-04-11 07:50:42.952 [rank:1] [train], epoch: 47/50, iter: 500/834, loss: 0.23337, lr: 0.008719, top1: 0.78370, throughput: 313.23 | 2022-04-11 07:50:42.976 [rank:3] [train], epoch: 47/50, iter: 500/834, loss: 0.23436, lr: 0.008719, top1: 0.78245, throughput: 313.02 | 2022-04-11 07:50:42.985 [rank:7] [train], epoch: 47/50, iter: 500/834, loss: 0.23494, lr: 0.008719, top1: 0.78224, throughput: 312.83 | 2022-04-11 07:50:43.001 [rank:5] [train], epoch: 47/50, iter: 600/834, loss: 0.23476, lr: 0.007871, top1: 0.78406, throughput: 313.13 | 2022-04-11 07:51:44.258 [rank:4] [train], epoch: 47/50, iter: 600/834, loss: 0.23347, lr: 0.007871, top1: 0.78385, throughput: 312.81 | 2022-04-11 07:51:44.260 [rank:0] [train], epoch: 47/50, iter: 600/834, loss: 0.23457, lr: 0.007871, top1: 0.78276, throughput: 312.90 | 2022-04-11 07:51:44.280 [rank:2] [train], epoch: 47/50, iter: 600/834, loss: 0.23405, lr: 0.007871, top1: 0.78286, throughput: 312.96 | 2022-04-11 07:51:44.302 [rank:1] [train], epoch: 47/50, iter: 600/834, loss: 0.23344, lr: 0.007871, top1: 0.78688, throughput: 313.05 | 2022-04-11 07:51:44.307 [rank:3] [train], epoch: 47/50, iter: 600/834, loss: 0.23432, lr: 0.007871, top1: 0.78422, throughput: 313.09 | 2022-04-11 07:51:44.310 [rank:7] [train], epoch: 47/50, iter: 600/834, loss: 0.23508, lr: 0.007871, top1: 0.78151, throughput: 313.50 | 2022-04-11 07:51:44.244 [rank:6] [train], epoch: 47/50, iter: 600/834, loss: 0.23115, lr: 0.007871, top1: 0.78901, throughput: 312.31 | 2022-04-11 07:51:44.350 [rank:6] [train], epoch: 47/50, iter: 700/834, loss: 0.23327, lr: 0.007066, top1: 0.78479, throughput: 314.85 | 2022-04-11 07:52:45.332 [rank:0] [train], epoch: 47/50, iter: 700/834, loss: 0.23476, lr: 0.007066, top1: 0.78453, throughput: 314.43 | 2022-04-11 07:52:45.343 [rank:7] [train], epoch: 47/50, iter: 700/834, loss: 0.23634, lr: 0.007066, top1: 0.77922, throughput: 314.16 | 2022-04-11 07:52:45.360 [rank:5] [train], epoch: 47/50, iter: 700/834, loss: 0.23489, lr: 0.007066, top1: 0.78141, throughput: 314.13 | 2022-04-11 07:52:45.379 [rank:1] [train], epoch: 47/50, iter: 700/834, loss: 0.23413, lr: 0.007066, top1: 0.78396, throughput: 314.28 | 2022-04-11 07:52:45.400 [rank:2] [train], epoch: 47/50, iter: 700/834, loss: 0.23377, lr: 0.007066, top1: 0.78448, throughput: 314.65 | 2022-04-11 07:52:45.322 [rank:4] [train], epoch: 47/50, iter: 700/834, loss: 0.23314, lr: 0.007066, top1: 0.78708, throughput: 313.80 | 2022-04-11 07:52:45.445 [rank:3] [train], epoch: 47/50, iter: 700/834, loss: 0.23442, lr: 0.007066, top1: 0.78188, throughput: 313.95 | 2022-04-11 07:52:45.465 [rank:1] [train], epoch: 47/50, iter: 800/834, loss: 0.23545, lr: 0.006305, top1: 0.78068, throughput: 313.72 | 2022-04-11 07:53:46.601 [rank:2] [train], epoch: 47/50, iter: 800/834, loss: 0.23326, lr: 0.006305, top1: 0.78698, throughput: 313.17 | 2022-04-11 07:53:46.631 [rank:7] [train], epoch: 47/50, iter: 800/834, loss: 0.23696, lr: 0.006305, top1: 0.77719, throughput: 313.32 | 2022-04-11 07:53:46.638 [rank:0] [train], epoch: 47/50, iter: 800/834, loss: 0.23416, lr: 0.006305, top1: 0.78250, throughput: 313.22 | 2022-04-11 07:53:46.641 [rank:6] [train], epoch: 47/50, iter: 800/834, loss: 0.23145, lr: 0.006305, top1: 0.78948, throughput: 313.14 | 2022-04-11 07:53:46.646 [rank:3] [train], epoch: 47/50, iter: 800/834, loss: 0.23467, lr: 0.006305, top1: 0.78542, throughput: 313.74 | 2022-04-11 07:53:46.662 [rank:5] [train], epoch: 47/50, iter: 800/834, loss: 0.23643, lr: 0.006305, top1: 0.77927, throughput: 313.29 | 2022-04-11 07:53:46.664 [rank:4] [train], epoch: 47/50, iter: 800/834, loss: 0.23138, lr: 0.006305, top1: 0.78844, throughput: 313.58 | 2022-04-11 07:53:46.674 [rank:1] [train], epoch: 47/50, iter: 834/834, loss: 0.22928, lr: 0.006056, top1: 0.80009, throughput: 310.31 | 2022-04-11 07:54:07.638 [rank:7] [train], epoch: 47/50, iter: 834/834, loss: 0.23326, lr: 0.006056, top1: 0.78462, throughput: 310.66 | 2022-04-11 07:54:07.652 [rank:2] [train], epoch: 47/50, iter: 834/834, loss: 0.23521, lr: 0.006056, top1: 0.78278, throughput: 310.53 | 2022-04-11 07:54:07.653 [rank:5] [train], epoch: 47/50, iter: 834/834, loss: 0.23035, lr: 0.006056, top1: 0.79289, throughput: 310.99 | 2022-04-11 07:54:07.655 [rank:4] [train], epoch: 47/50, iter: 834/834, loss: 0.23489, lr: 0.006056, top1: 0.78002, throughput: 311.07 | 2022-04-11 07:54:07.660 [rank:0] [train], epoch: 47/50, iter: 834/834, loss: 0.23722, lr: 0.006056, top1: 0.77619, throughput: 310.57 | 2022-04-11 07:54:07.660 [rank:3] [train], epoch: 47/50, iter: 834/834, loss: 0.23229, lr: 0.006056, top1: 0.78631, throughput: 310.64 | 2022-04-11 07:54:07.676 [rank:6] [train], epoch: 47/50, iter: 834/834, loss: 0.23628, lr: 0.006056, top1: 0.77558, throughput: 310.41 | 2022-04-11 07:54:07.676 [rank:0] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.76144, throughput: 487.41 | 2022-04-11 07:54:20.483 [rank:4] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.75664, throughput: 487.19 | 2022-04-11 07:54:20.489 [rank:3] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.76016, throughput: 487.65 | 2022-04-11 07:54:20.493 [rank:7] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.76928, throughput: 485.97 | 2022-04-11 07:54:20.513 [rank:2] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.75328, throughput: 485.49 | 2022-04-11 07:54:20.526 [rank:5] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.75872, throughput: 484.49 | 2022-04-11 07:54:20.555 [rank:6] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.76800, throughput: 485.07 | 2022-04-11 07:54:20.561 [rank:1] [eval], epoch: 47/50, iter: 125/125, loss: 0.00000, lr: 0.006056, top1: 0.76880, throughput: 482.79 | 2022-04-11 07:54:20.583 [rank:3] [train], epoch: 48/50, iter: 100/834, loss: 0.23378, lr: 0.005352, top1: 0.78547, throughput: 313.21 | 2022-04-11 07:55:21.793 [rank:6] [train], epoch: 48/50, iter: 100/834, loss: 0.23321, lr: 0.005352, top1: 0.78599, throughput: 313.56 | 2022-04-11 07:55:21.793 [rank:5] [train], epoch: 48/50, iter: 100/834, loss: 0.23366, lr: 0.005352, top1: 0.78427, throughput: 313.46 | 2022-04-11 07:55:21.806 [rank:2] [train], epoch: 48/50, iter: 100/834, loss: 0.23429, lr: 0.005352, top1: 0.78026, throughput: 313.26 | 2022-04-11 07:55:21.817 [rank:1] [train], epoch: 48/50, iter: 100/834, loss: 0.23195, lr: 0.005352, top1: 0.78870, throughput: 313.53 | 2022-04-11 07:55:21.822 [rank:7] [train], epoch: 48/50, iter: 100/834, loss: 0.23151, lr: 0.005352, top1: 0.78938, throughput: 313.08 | 2022-04-11 07:55:21.838 [rank:4] [train], epoch: 48/50, iter: 100/834, loss: 0.23215, lr: 0.005352, top1: 0.78943, throughput: 312.89 | 2022-04-11 07:55:21.853 [rank:0] [train], epoch: 48/50, iter: 100/834, loss: 0.23202, lr: 0.005352, top1: 0.78698, throughput: 313.24 | 2022-04-11 07:55:21.777 [rank:0] [train], epoch: 48/50, iter: 200/834, loss: 0.23294, lr: 0.004692, top1: 0.78682, throughput: 312.87 | 2022-04-11 07:56:23.144 [rank:5] [train], epoch: 48/50, iter: 200/834, loss: 0.23002, lr: 0.004692, top1: 0.79490, throughput: 312.94 | 2022-04-11 07:56:23.161 [rank:6] [train], epoch: 48/50, iter: 200/834, loss: 0.23260, lr: 0.004692, top1: 0.78703, throughput: 312.82 | 2022-04-11 07:56:23.170 [rank:4] [train], epoch: 48/50, iter: 200/834, loss: 0.23319, lr: 0.004692, top1: 0.78396, throughput: 313.12 | 2022-04-11 07:56:23.171 [rank:7] [train], epoch: 48/50, iter: 200/834, loss: 0.23343, lr: 0.004692, top1: 0.78161, throughput: 312.98 | 2022-04-11 07:56:23.184 [rank:2] [train], epoch: 48/50, iter: 200/834, loss: 0.23353, lr: 0.004692, top1: 0.78427, throughput: 312.82 | 2022-04-11 07:56:23.193 [rank:3] [train], epoch: 48/50, iter: 200/834, loss: 0.23231, lr: 0.004692, top1: 0.78906, throughput: 312.59 | 2022-04-11 07:56:23.215 [rank:1] [train], epoch: 48/50, iter: 200/834, loss: 0.23241, lr: 0.004692, top1: 0.78646, throughput: 312.62 | 2022-04-11 07:56:23.238 [rank:5] [train], epoch: 48/50, iter: 300/834, loss: 0.23317, lr: 0.004075, top1: 0.78464, throughput: 313.19 | 2022-04-11 07:57:24.466 [rank:6] [train], epoch: 48/50, iter: 300/834, loss: 0.23326, lr: 0.004075, top1: 0.78896, throughput: 313.05 | 2022-04-11 07:57:24.502 [rank:4] [train], epoch: 48/50, iter: 300/834, loss: 0.23547, lr: 0.004075, top1: 0.78146, throughput: 313.05 | 2022-04-11 07:57:24.503 [rank:3] [train], epoch: 48/50, iter: 300/834, loss: 0.23366, lr: 0.004075, top1: 0.78401, throughput: 313.20 | 2022-04-11 07:57:24.517 [rank:0] [train], epoch: 48/50, iter: 300/834, loss: 0.23237, lr: 0.004075, top1: 0.78651, throughput: 312.83 | 2022-04-11 07:57:24.519 [rank:2] [train], epoch: 48/50, iter: 300/834, loss: 0.23298, lr: 0.004075, top1: 0.78328, throughput: 312.94 | 2022-04-11 07:57:24.547 [rank:1] [train], epoch: 48/50, iter: 300/834, loss: 0.23314, lr: 0.004075, top1: 0.78635, throughput: 313.08 | 2022-04-11 07:57:24.564 [rank:7] [train], epoch: 48/50, iter: 300/834, loss: 0.23580, lr: 0.004075, top1: 0.78229, throughput: 313.24 | 2022-04-11 07:57:24.480 [rank:4] [train], epoch: 48/50, iter: 400/834, loss: 0.23313, lr: 0.003502, top1: 0.78609, throughput: 314.07 | 2022-04-11 07:58:25.636 [rank:0] [train], epoch: 48/50, iter: 400/834, loss: 0.23338, lr: 0.003502, top1: 0.78417, throughput: 314.15 | 2022-04-11 07:58:25.637 [rank:2] [train], epoch: 48/50, iter: 400/834, loss: 0.23225, lr: 0.003502, top1: 0.78677, throughput: 314.21 | 2022-04-11 07:58:25.652 [rank:3] [train], epoch: 48/50, iter: 400/834, loss: 0.23334, lr: 0.003502, top1: 0.78328, throughput: 313.99 | 2022-04-11 07:58:25.665 [rank:6] [train], epoch: 48/50, iter: 400/834, loss: 0.23070, lr: 0.003502, top1: 0.78927, throughput: 313.86 | 2022-04-11 07:58:25.677 [rank:5] [train], epoch: 48/50, iter: 400/834, loss: 0.23373, lr: 0.003502, top1: 0.78120, throughput: 313.66 | 2022-04-11 07:58:25.679 [rank:1] [train], epoch: 48/50, iter: 400/834, loss: 0.23110, lr: 0.003502, top1: 0.78979, throughput: 314.56 | 2022-04-11 07:58:25.602 [rank:7] [train], epoch: 48/50, iter: 400/834, loss: 0.23375, lr: 0.003502, top1: 0.78224, throughput: 313.60 | 2022-04-11 07:58:25.704 [rank:5] [train], epoch: 48/50, iter: 500/834, loss: 0.23413, lr: 0.002971, top1: 0.78339, throughput: 313.80 | 2022-04-11 07:59:26.864 [rank:3] [train], epoch: 48/50, iter: 500/834, loss: 0.23394, lr: 0.002971, top1: 0.78479, throughput: 313.72 | 2022-04-11 07:59:26.866 [rank:4] [train], epoch: 48/50, iter: 500/834, loss: 0.23135, lr: 0.002971, top1: 0.78969, throughput: 313.55 | 2022-04-11 07:59:26.870 [rank:2] [train], epoch: 48/50, iter: 500/834, loss: 0.23302, lr: 0.002971, top1: 0.78839, throughput: 313.63 | 2022-04-11 07:59:26.870 [rank:0] [train], epoch: 48/50, iter: 500/834, loss: 0.23458, lr: 0.002971, top1: 0.78318, throughput: 313.47 | 2022-04-11 07:59:26.887 [rank:6] [train], epoch: 48/50, iter: 500/834, loss: 0.23224, lr: 0.002971, top1: 0.78781, throughput: 313.51 | 2022-04-11 07:59:26.918 [rank:1] [train], epoch: 48/50, iter: 500/834, loss: 0.23316, lr: 0.002971, top1: 0.78958, throughput: 313.13 | 2022-04-11 07:59:26.919 [rank:7] [train], epoch: 48/50, iter: 500/834, loss: 0.23457, lr: 0.002971, top1: 0.78266, throughput: 313.28 | 2022-04-11 07:59:26.991 [rank:7] [train], epoch: 48/50, iter: 600/834, loss: 0.23197, lr: 0.002485, top1: 0.78724, throughput: 314.96 | 2022-04-11 08:00:27.951 [rank:2] [train], epoch: 48/50, iter: 600/834, loss: 0.23346, lr: 0.002485, top1: 0.78422, throughput: 314.29 | 2022-04-11 08:00:27.961 [rank:5] [train], epoch: 48/50, iter: 600/834, loss: 0.23398, lr: 0.002485, top1: 0.78255, throughput: 314.22 | 2022-04-11 08:00:27.967 [rank:6] [train], epoch: 48/50, iter: 600/834, loss: 0.23580, lr: 0.002485, top1: 0.78062, throughput: 314.48 | 2022-04-11 08:00:27.970 [rank:0] [train], epoch: 48/50, iter: 600/834, loss: 0.23274, lr: 0.002485, top1: 0.78724, throughput: 314.30 | 2022-04-11 08:00:27.974 [rank:4] [train], epoch: 48/50, iter: 600/834, loss: 0.23230, lr: 0.002485, top1: 0.78526, throughput: 314.14 | 2022-04-11 08:00:27.990 [rank:1] [train], epoch: 48/50, iter: 600/834, loss: 0.23431, lr: 0.002485, top1: 0.78552, throughput: 314.32 | 2022-04-11 08:00:28.004 [rank:3] [train], epoch: 48/50, iter: 600/834, loss: 0.23314, lr: 0.002485, top1: 0.78542, throughput: 314.00 | 2022-04-11 08:00:28.013 [rank:0] [train], epoch: 48/50, iter: 700/834, loss: 0.23407, lr: 0.002041, top1: 0.78479, throughput: 313.36 | 2022-04-11 08:01:29.246 [rank:6] [train], epoch: 48/50, iter: 700/834, loss: 0.23247, lr: 0.002041, top1: 0.78651, throughput: 313.32 | 2022-04-11 08:01:29.249 [rank:2] [train], epoch: 48/50, iter: 700/834, loss: 0.23319, lr: 0.002041, top1: 0.78781, throughput: 313.16 | 2022-04-11 08:01:29.271 [rank:7] [train], epoch: 48/50, iter: 700/834, loss: 0.23513, lr: 0.002041, top1: 0.78307, throughput: 313.11 | 2022-04-11 08:01:29.271 [rank:3] [train], epoch: 48/50, iter: 700/834, loss: 0.23382, lr: 0.002041, top1: 0.78438, throughput: 313.33 | 2022-04-11 08:01:29.290 [rank:1] [train], epoch: 48/50, iter: 700/834, loss: 0.23413, lr: 0.002041, top1: 0.78500, throughput: 313.20 | 2022-04-11 08:01:29.306 [rank:5] [train], epoch: 48/50, iter: 700/834, loss: 0.23360, lr: 0.002041, top1: 0.78615, throughput: 313.02 | 2022-04-11 08:01:29.306 [rank:4] [train], epoch: 48/50, iter: 700/834, loss: 0.23165, lr: 0.002041, top1: 0.78839, throughput: 313.05 | 2022-04-11 08:01:29.322 [rank:5] [train], epoch: 48/50, iter: 800/834, loss: 0.23205, lr: 0.001642, top1: 0.78510, throughput: 314.04 | 2022-04-11 08:02:30.444 [rank:6] [train], epoch: 48/50, iter: 800/834, loss: 0.23365, lr: 0.001642, top1: 0.78708, throughput: 313.65 | 2022-04-11 08:02:30.464 [rank:7] [train], epoch: 48/50, iter: 800/834, loss: 0.23257, lr: 0.001642, top1: 0.78760, throughput: 313.71 | 2022-04-11 08:02:30.473 [rank:2] [train], epoch: 48/50, iter: 800/834, loss: 0.23268, lr: 0.001642, top1: 0.78901, throughput: 313.70 | 2022-04-11 08:02:30.477 [rank:3] [train], epoch: 48/50, iter: 800/834, loss: 0.23166, lr: 0.001642, top1: 0.79203, throughput: 313.65 | 2022-04-11 08:02:30.505 [rank:4] [train], epoch: 48/50, iter: 800/834, loss: 0.23026, lr: 0.001642, top1: 0.79286, throughput: 313.80 | 2022-04-11 08:02:30.507 [rank:1] [train], epoch: 48/50, iter: 800/834, loss: 0.23287, lr: 0.001642, top1: 0.78594, throughput: 313.69 | 2022-04-11 08:02:30.513 [rank:0] [train], epoch: 48/50, iter: 800/834, loss: 0.23120, lr: 0.001642, top1: 0.78953, throughput: 313.24 | 2022-04-11 08:02:30.540 [rank:2] [train], epoch: 48/50, iter: 834/834, loss: 0.23633, lr: 0.001515, top1: 0.78232, throughput: 313.87 | 2022-04-11 08:02:51.275 [rank:0] [train], epoch: 48/50, iter: 834/834, loss: 0.23286, lr: 0.001515, top1: 0.79029, throughput: 314.25 | 2022-04-11 08:02:51.313 [rank:6] [train], epoch: 48/50, iter: 834/834, loss: 0.23220, lr: 0.001515, top1: 0.78722, throughput: 312.92 | 2022-04-11 08:02:51.326 [rank:4] [train], epoch: 48/50, iter: 834/834, loss: 0.23076, lr: 0.001515, top1: 0.78860, throughput: 313.56 | 2022-04-11 08:02:51.326 [rank:7] [train], epoch: 48/50, iter: 834/834, loss: 0.23318, lr: 0.001515, top1: 0.78477, throughput: 313.02 | 2022-04-11 08:02:51.328 [rank:3] [train], epoch: 48/50, iter: 834/834, loss: 0.23316, lr: 0.001515, top1: 0.78294, throughput: 313.48 | 2022-04-11 08:02:51.329 [rank:5] [train], epoch: 48/50, iter: 834/834, loss: 0.23296, lr: 0.001515, top1: 0.78585, throughput: 312.54 | 2022-04-11 08:02:51.331 [rank:1] [train], epoch: 48/50, iter: 834/834, loss: 0.23414, lr: 0.001515, top1: 0.77926, throughput: 313.27 | 2022-04-11 08:02:51.351 [rank:0] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.76528, throughput: 489.06 | 2022-04-11 08:03:04.093 [rank:3] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.76064, throughput: 489.32 | 2022-04-11 08:03:04.102 [rank:4] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.76000, throughput: 488.89 | 2022-04-11 08:03:04.110 [rank:7] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.76960, throughput: 488.91 | 2022-04-11 08:03:04.112 [rank:5] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.75920, throughput: 488.27 | 2022-04-11 08:03:04.131 [rank:2] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.75376, throughput: 485.66 | 2022-04-11 08:03:04.144 [rank:1] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.77200, throughput: 487.81 | 2022-04-11 08:03:04.163 [rank:6] [eval], epoch: 48/50, iter: 125/125, loss: 0.00000, lr: 0.001515, top1: 0.76992, throughput: 486.06 | 2022-04-11 08:03:04.184 [rank:6] [train], epoch: 49/50, iter: 100/834, loss: 0.23264, lr: 0.001174, top1: 0.78464, throughput: 314.58 | 2022-04-11 08:04:05.217 [rank:4] [train], epoch: 49/50, iter: 100/834, loss: 0.23110, lr: 0.001174, top1: 0.78875, throughput: 314.12 | 2022-04-11 08:04:05.234 [rank:0] [train], epoch: 49/50, iter: 100/834, loss: 0.23129, lr: 0.001174, top1: 0.79083, throughput: 313.84 | 2022-04-11 08:04:05.271 [rank:2] [train], epoch: 49/50, iter: 100/834, loss: 0.23127, lr: 0.001174, top1: 0.78901, throughput: 314.10 | 2022-04-11 08:04:05.271 [rank:3] [train], epoch: 49/50, iter: 100/834, loss: 0.23390, lr: 0.001174, top1: 0.78599, throughput: 313.85 | 2022-04-11 08:04:05.278 [rank:7] [train], epoch: 49/50, iter: 100/834, loss: 0.23341, lr: 0.001174, top1: 0.78422, throughput: 313.87 | 2022-04-11 08:04:05.283 [rank:5] [train], epoch: 49/50, iter: 100/834, loss: 0.23289, lr: 0.001174, top1: 0.79198, throughput: 313.67 | 2022-04-11 08:04:05.343 [rank:1] [train], epoch: 49/50, iter: 100/834, loss: 0.23360, lr: 0.001174, top1: 0.78568, throughput: 314.23 | 2022-04-11 08:04:05.265 [rank:4] [train], epoch: 49/50, iter: 200/834, loss: 0.23063, lr: 0.000876, top1: 0.79688, throughput: 312.51 | 2022-04-11 08:05:06.672 [rank:3] [train], epoch: 49/50, iter: 200/834, loss: 0.23151, lr: 0.000876, top1: 0.78823, throughput: 312.68 | 2022-04-11 08:05:06.683 [rank:5] [train], epoch: 49/50, iter: 200/834, loss: 0.23187, lr: 0.000876, top1: 0.79109, throughput: 312.96 | 2022-04-11 08:05:06.692 [rank:2] [train], epoch: 49/50, iter: 200/834, loss: 0.23224, lr: 0.000876, top1: 0.78672, throughput: 312.45 | 2022-04-11 08:05:06.721 [rank:7] [train], epoch: 49/50, iter: 200/834, loss: 0.23294, lr: 0.000876, top1: 0.78635, throughput: 312.44 | 2022-04-11 08:05:06.735 [rank:1] [train], epoch: 49/50, iter: 200/834, loss: 0.23594, lr: 0.000876, top1: 0.78016, throughput: 312.21 | 2022-04-11 08:05:06.762 [rank:0] [train], epoch: 49/50, iter: 200/834, loss: 0.23239, lr: 0.000876, top1: 0.78469, throughput: 312.22 | 2022-04-11 08:05:06.765 [rank:6] [train], epoch: 49/50, iter: 200/834, loss: 0.23122, lr: 0.000876, top1: 0.78802, throughput: 311.91 | 2022-04-11 08:05:06.774 [rank:3] [train], epoch: 49/50, iter: 300/834, loss: 0.23083, lr: 0.000621, top1: 0.78865, throughput: 315.35 | 2022-04-11 08:06:07.568 [rank:7] [train], epoch: 49/50, iter: 300/834, loss: 0.23292, lr: 0.000621, top1: 0.78885, throughput: 315.50 | 2022-04-11 08:06:07.590 [rank:0] [train], epoch: 49/50, iter: 300/834, loss: 0.23062, lr: 0.000621, top1: 0.78990, throughput: 315.53 | 2022-04-11 08:06:07.615 [rank:5] [train], epoch: 49/50, iter: 300/834, loss: 0.23234, lr: 0.000621, top1: 0.78818, throughput: 315.11 | 2022-04-11 08:06:07.623 [rank:1] [train], epoch: 49/50, iter: 300/834, loss: 0.23293, lr: 0.000621, top1: 0.78167, throughput: 315.42 | 2022-04-11 08:06:07.633 [rank:4] [train], epoch: 49/50, iter: 300/834, loss: 0.23217, lr: 0.000621, top1: 0.78755, throughput: 314.94 | 2022-04-11 08:06:07.637 [rank:2] [train], epoch: 49/50, iter: 300/834, loss: 0.23350, lr: 0.000621, top1: 0.78661, throughput: 315.11 | 2022-04-11 08:06:07.653 [rank:6] [train], epoch: 49/50, iter: 300/834, loss: 0.23231, lr: 0.000621, top1: 0.78385, throughput: 315.22 | 2022-04-11 08:06:07.683 [rank:4] [train], epoch: 49/50, iter: 400/834, loss: 0.23280, lr: 0.000410, top1: 0.79068, throughput: 313.48 | 2022-04-11 08:07:08.886 [rank:6] [train], epoch: 49/50, iter: 400/834, loss: 0.23139, lr: 0.000410, top1: 0.79109, throughput: 313.50 | 2022-04-11 08:07:08.926 [rank:7] [train], epoch: 49/50, iter: 400/834, loss: 0.23101, lr: 0.000410, top1: 0.78771, throughput: 312.94 | 2022-04-11 08:07:08.943 [rank:5] [train], epoch: 49/50, iter: 400/834, loss: 0.23244, lr: 0.000410, top1: 0.78667, throughput: 313.08 | 2022-04-11 08:07:08.950 [rank:1] [train], epoch: 49/50, iter: 400/834, loss: 0.23296, lr: 0.000410, top1: 0.78557, throughput: 313.13 | 2022-04-11 08:07:08.950 [rank:2] [train], epoch: 49/50, iter: 400/834, loss: 0.23194, lr: 0.000410, top1: 0.79016, throughput: 313.20 | 2022-04-11 08:07:08.956 [rank:0] [train], epoch: 49/50, iter: 400/834, loss: 0.23148, lr: 0.000410, top1: 0.79120, throughput: 312.92 | 2022-04-11 08:07:08.973 [rank:3] [train], epoch: 49/50, iter: 400/834, loss: 0.23475, lr: 0.000410, top1: 0.78339, throughput: 312.66 | 2022-04-11 08:07:08.976 [rank:0] [train], epoch: 49/50, iter: 500/834, loss: 0.22984, lr: 0.000243, top1: 0.79281, throughput: 313.41 | 2022-04-11 08:08:10.236 [rank:7] [train], epoch: 49/50, iter: 500/834, loss: 0.23340, lr: 0.000243, top1: 0.78349, throughput: 313.16 | 2022-04-11 08:08:10.255 [rank:4] [train], epoch: 49/50, iter: 500/834, loss: 0.23197, lr: 0.000243, top1: 0.78557, throughput: 312.86 | 2022-04-11 08:08:10.256 [rank:6] [train], epoch: 49/50, iter: 500/834, loss: 0.23286, lr: 0.000243, top1: 0.78620, throughput: 313.01 | 2022-04-11 08:08:10.266 [rank:5] [train], epoch: 49/50, iter: 500/834, loss: 0.23357, lr: 0.000243, top1: 0.78573, throughput: 313.12 | 2022-04-11 08:08:10.268 [rank:1] [train], epoch: 49/50, iter: 500/834, loss: 0.23145, lr: 0.000243, top1: 0.78927, throughput: 313.08 | 2022-04-11 08:08:10.277 [rank:2] [train], epoch: 49/50, iter: 500/834, loss: 0.23426, lr: 0.000243, top1: 0.78339, throughput: 313.04 | 2022-04-11 08:08:10.290 [rank:3] [train], epoch: 49/50, iter: 500/834, loss: 0.23018, lr: 0.000243, top1: 0.79208, throughput: 313.14 | 2022-04-11 08:08:10.290 [rank:2] [train], epoch: 49/50, iter: 600/834, loss: 0.23275, lr: 0.000119, top1: 0.78661, throughput: 314.97 | 2022-04-11 08:09:11.247 [rank:5] [train], epoch: 49/50, iter: 600/834, loss: 0.23127, lr: 0.000119, top1: 0.78891, throughput: 314.70 | 2022-04-11 08:09:11.280 [rank:7] [train], epoch: 49/50, iter: 600/834, loss: 0.23266, lr: 0.000119, top1: 0.78818, throughput: 314.58 | 2022-04-11 08:09:11.288 [rank:3] [train], epoch: 49/50, iter: 600/834, loss: 0.23380, lr: 0.000119, top1: 0.78776, throughput: 314.76 | 2022-04-11 08:09:11.288 [rank:6] [train], epoch: 49/50, iter: 600/834, loss: 0.23338, lr: 0.000119, top1: 0.78521, throughput: 314.58 | 2022-04-11 08:09:11.300 [rank:4] [train], epoch: 49/50, iter: 600/834, loss: 0.23297, lr: 0.000119, top1: 0.78552, throughput: 314.87 | 2022-04-11 08:09:11.234 [rank:0] [train], epoch: 49/50, iter: 600/834, loss: 0.23025, lr: 0.000119, top1: 0.79057, throughput: 314.27 | 2022-04-11 08:09:11.330 [rank:1] [train], epoch: 49/50, iter: 600/834, loss: 0.23190, lr: 0.000119, top1: 0.79156, throughput: 314.92 | 2022-04-11 08:09:11.245 [rank:0] [train], epoch: 49/50, iter: 700/834, loss: 0.23069, lr: 0.000039, top1: 0.79224, throughput: 312.39 | 2022-04-11 08:10:12.791 [rank:2] [train], epoch: 49/50, iter: 700/834, loss: 0.23230, lr: 0.000039, top1: 0.78932, throughput: 311.97 | 2022-04-11 08:10:12.792 [rank:1] [train], epoch: 49/50, iter: 700/834, loss: 0.23138, lr: 0.000039, top1: 0.78958, throughput: 311.91 | 2022-04-11 08:10:12.802 [rank:4] [train], epoch: 49/50, iter: 700/834, loss: 0.23312, lr: 0.000039, top1: 0.78891, throughput: 311.80 | 2022-04-11 08:10:12.812 [rank:3] [train], epoch: 49/50, iter: 700/834, loss: 0.23234, lr: 0.000039, top1: 0.78563, throughput: 312.02 | 2022-04-11 08:10:12.823 [rank:5] [train], epoch: 49/50, iter: 700/834, loss: 0.23201, lr: 0.000039, top1: 0.78839, throughput: 311.89 | 2022-04-11 08:10:12.840 [rank:6] [train], epoch: 49/50, iter: 700/834, loss: 0.23261, lr: 0.000039, top1: 0.78781, throughput: 312.41 | 2022-04-11 08:10:12.758 [rank:7] [train], epoch: 49/50, iter: 700/834, loss: 0.23309, lr: 0.000039, top1: 0.78646, throughput: 311.66 | 2022-04-11 08:10:12.893 [rank:4] [train], epoch: 49/50, iter: 800/834, loss: 0.23331, lr: 0.000003, top1: 0.78724, throughput: 312.39 | 2022-04-11 08:11:14.273 [rank:0] [train], epoch: 49/50, iter: 800/834, loss: 0.23229, lr: 0.000003, top1: 0.78812, throughput: 312.25 | 2022-04-11 08:11:14.280 [rank:3] [train], epoch: 49/50, iter: 800/834, loss: 0.23241, lr: 0.000003, top1: 0.78568, throughput: 312.29 | 2022-04-11 08:11:14.305 [rank:1] [train], epoch: 49/50, iter: 800/834, loss: 0.23096, lr: 0.000003, top1: 0.79344, throughput: 312.14 | 2022-04-11 08:11:14.313 [rank:2] [train], epoch: 49/50, iter: 800/834, loss: 0.23255, lr: 0.000003, top1: 0.78547, throughput: 312.06 | 2022-04-11 08:11:14.319 [rank:5] [train], epoch: 49/50, iter: 800/834, loss: 0.23146, lr: 0.000003, top1: 0.79021, throughput: 312.30 | 2022-04-11 08:11:14.320 [rank:7] [train], epoch: 49/50, iter: 800/834, loss: 0.23043, lr: 0.000003, top1: 0.79000, throughput: 312.54 | 2022-04-11 08:11:14.326 [rank:6] [train], epoch: 49/50, iter: 800/834, loss: 0.23381, lr: 0.000003, top1: 0.78193, throughput: 311.79 | 2022-04-11 08:11:14.338 [rank:4] [train], epoch: 49/50, iter: 834/834, loss: 0.23319, lr: 0.000000, top1: 0.79059, throughput: 310.13 | 2022-04-11 08:11:35.322 [rank:2] [train], epoch: 49/50, iter: 834/834, loss: 0.22918, lr: 0.000000, top1: 0.79059, throughput: 310.62 | 2022-04-11 08:11:35.335 [rank:1] [train], epoch: 49/50, iter: 834/834, loss: 0.23242, lr: 0.000000, top1: 0.79167, throughput: 310.51 | 2022-04-11 08:11:35.336 [rank:5] [train], epoch: 49/50, iter: 834/834, loss: 0.23375, lr: 0.000000, top1: 0.78585, throughput: 310.56 | 2022-04-11 08:11:35.340 [rank:7] [train], epoch: 49/50, iter: 834/834, loss: 0.23100, lr: 0.000000, top1: 0.78814, throughput: 310.36 | 2022-04-11 08:11:35.359 [rank:3] [train], epoch: 49/50, iter: 834/834, loss: 0.23177, lr: 0.000000, top1: 0.79611, throughput: 309.96 | 2022-04-11 08:11:35.366 [rank:6] [train], epoch: 49/50, iter: 834/834, loss: 0.22936, lr: 0.000000, top1: 0.79381, throughput: 310.44 | 2022-04-11 08:11:35.366 [rank:0] [train], epoch: 49/50, iter: 834/834, loss: 0.23337, lr: 0.000000, top1: 0.78569, throughput: 309.28 | 2022-04-11 08:11:35.387 [rank:5] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.75728, throughput: 488.37 | 2022-04-11 08:11:48.137 [rank:7] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.76896, throughput: 489.11 | 2022-04-11 08:11:48.138 [rank:2] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.75296, throughput: 488.14 | 2022-04-11 08:11:48.138 [rank:3] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.76048, throughput: 489.32 | 2022-04-11 08:11:48.138 [rank:4] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.76032, throughput: 487.66 | 2022-04-11 08:11:48.138 [rank:6] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.76848, throughput: 489.20 | 2022-04-11 08:11:48.142 [rank:0] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.76384, throughput: 490.00 | 2022-04-11 08:11:48.142 [rank:1] [eval], epoch: 49/50, iter: 125/125, loss: 0.00000, lr: 0.000000, top1: 0.77088, throughput: 486.32 | 2022-04-11 08:11:48.188