loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 ***************************************** Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed. ***************************************** loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: loaded library: loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 /usr/lib/x86_64-linux-gnu/libibverbs.so.1loaded library: loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 /usr/lib/x86_64-linux-gnu/libibverbs.so.1 /usr/lib/x86_64-linux-gnu/libibverbs.so.1 ------------------------ arguments ------------------------ batch_size ...................................... 131072 batch_size_per_proc ............................. 16384 data_dir ........................................ /dataset/f9f659c5/wdl_ofrecord data_part_name_suffix_length .................... 5 data_part_num ................................... 256 dataset_format .................................. ofrecord ddp ............................................. True deep_dropout_rate ............................... 0.5 deep_embedding_vec_size ......................... 16 deep_vocab_size ................................. 2322444 eval_after_training ............................. False eval_batchs ..................................... 20 eval_interval ................................... 0 execution_mode .................................. eager hidden_size ..................................... 1024 hidden_units_num ................................ 2 learning_rate ................................... 0.001 loss_print_every_n_iter ......................... 100 max_iter ........................................ 1100 model_load_dir .................................. model_save_dir .................................. ./checkpoint num_deep_sparse_fields .......................... 26 num_dense_fields ................................ 13 num_wide_sparse_fields .......................... 2 save_initial_model .............................. False save_model_after_each_eval ...................... False test_name ....................................... noname_test wide_vocab_size ................................. 2322444 -------------------- end of arguments --------------------- [rank:0] iter: 100/1100, loss: 0.5026984214782715, latency(ms): 95.1986300572752953 | 2022-05-10 02:40:13.747 timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/10 02:40:13.897, Tesla V100-SXM2-32GB, 470.57.02, 31 %, 8 %, 32510 MiB, 29888 MiB, 2622 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/10 02:40:13.906, Tesla V100-SXM2-32GB, 470.57.02, 27 %, 8 %, 32510 MiB, 29908 MiB, 2602 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/10 02:40:13.909, Tesla V100-SXM2-32GB, 470.57.02, 31 %, 8 %, 32510 MiB, 29888 MiB, 2622 MiB 2022/05/10 02:40:13.911, Tesla V100-SXM2-32GB, 470.57.02, 14 %, 3 %, 32510 MiB, 29984 MiB, 2526 MiB 2022/05/10 02:40:13.913, Tesla V100-SXM2-32GB, 470.57.02, 31 %, 8 %, 32510 MiB, 29888 MiB, 2622 MiB 2022/05/10 02:40:13.915, Tesla V100-SXM2-32GB, 470.57.02, 31 %, 8 %, 32510 MiB, 29888 MiB, 2622 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/10 02:40:13.918, Tesla V100-SXM2-32GB, 470.57.02, 27 %, 8 %, 32510 MiB, 29908 MiB, 2602 MiB 2022/05/10 02:40:13.920, Tesla V100-SXM2-32GB, 470.57.02, 15 %, 9 %, 32510 MiB, 29960 MiB, 2550 MiB 2022/05/10 02:40:13.923, Tesla V100-SXM2-32GB, 470.57.02, 27 %, 8 %, 32510 MiB, 29908 MiB, 2602 MiB 2022/05/10 02:40:13.924, Tesla V100-SXM2-32GB, 470.57.02, 27 %, 8 %, 32510 MiB, 29908 MiB, 2602 MiB 2022/05/10 02:40:13.924, Tesla V100-SXM2-32GB, 470.57.02, 31 %, 8 %, 32510 MiB, 29888 MiB, 2622 MiB 2022/05/10 02:40:13.927, Tesla V100-SXM2-32GB, 470.57.02, 14 %, 3 %, 32510 MiB, 29984 MiB, 2526 MiB 2022/05/10 02:40:13.926, Tesla V100-SXM2-32GB, 470.57.02, 31 %, 8 %, 32510 MiB, 29888 MiB, 2622 MiB 2022/05/10 02:40:13.929, Tesla V100-SXM2-32GB, 470.57.02, 67 %, 21 %, 32510 MiB, 29968 MiB, 2542 MiB 2022/05/10 02:40:13.932, Tesla V100-SXM2-32GB, 470.57.02, 14 %, 3 %, 32510 MiB, 29984 MiB, 2526 MiB 2022/05/10 02:40:13.933, Tesla V100-SXM2-32GB, 470.57.02, 14 %, 3 %, 32510 MiB, 29984 MiB, 2526 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/10 02:40:13.935, Tesla V100-SXM2-32GB, 470.57.02, 27 %, 8 %, 32510 MiB, 29908 MiB, 2602 MiB 2022/05/10 02:40:13.935, Tesla V100-SXM2-32GB, 470.57.02, 15 %, 9 %, 32510 MiB, 29960 MiB, 2550 MiB 2022/05/10 02:40:13.936, Tesla V100-SXM2-32GB, 470.57.02, 27 %, 8 %, 32510 MiB, 29908 MiB, 2602 MiB 2022/05/10 02:40:13.937, Tesla V100-SXM2-32GB, 470.57.02, 4 %, 2 %, 32510 MiB, 29900 MiB, 2610 MiB 2022/05/10 02:40:13.940, Tesla V100-SXM2-32GB, 470.57.02, 15 %, 9 %, 32510 MiB, 29960 MiB, 2550 MiB 2022/05/10 02:40:13.942, Tesla V100-SXM2-32GB, 470.57.02, 15 %, 9 %, 32510 MiB, 29960 MiB, 2550 MiB 2022/05/10 02:40:13.942, Tesla V100-SXM2-32GB, 470.57.02, 31 %, 8 %, 32510 MiB, 29888 MiB, 2622 MiB 2022/05/10 02:40:13.943, Tesla V100-SXM2-32GB, 470.57.02, 14 %, 3 %, 32510 MiB, 29984 MiB, 2526 MiB 2022/05/10 02:40:13.944, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29968 MiB, 2542 MiB 2022/05/10 02:40:13.945, Tesla V100-SXM2-32GB, 470.57.02, 14 %, 3 %, 32510 MiB, 29984 MiB, 2526 MiB 2022/05/10 02:40:13.946, Tesla V100-SXM2-32GB, 470.57.02, 47 %, 15 %, 32510 MiB, 29844 MiB, 2666 MiB 2022/05/10 02:40:13.949, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29968 MiB, 2542 MiB 2022/05/10 02:40:13.951, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29968 MiB, 2542 MiB 2022/05/10 02:40:13.952, Tesla V100-SXM2-32GB, 470.57.02, 27 %, 8 %, 32510 MiB, 29908 MiB, 2602 MiB 2022/05/10 02:40:13.952, Tesla V100-SXM2-32GB, 470.57.02, 15 %, 9 %, 32510 MiB, 29960 MiB, 2550 MiB 2022/05/10 02:40:13.953, Tesla V100-SXM2-32GB, 470.57.02, 4 %, 2 %, 32510 MiB, 29900 MiB, 2610 MiB 2022/05/10 02:40:13.954, Tesla V100-SXM2-32GB, 470.57.02, 15 %, 9 %, 32510 MiB, 29960 MiB, 2550 MiB 2022/05/10 02:40:13.955, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29924 MiB, 2586 MiB 2022/05/10 02:40:13.959, Tesla V100-SXM2-32GB, 470.57.02, 4 %, 2 %, 32510 MiB, 29900 MiB, 2610 MiB 2022/05/10 02:40:13.960, Tesla V100-SXM2-32GB, 470.57.02, 4 %, 2 %, 32510 MiB, 29900 MiB, 2610 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/10 02:40:13.961, Tesla V100-SXM2-32GB, 470.57.02, 14 %, 3 %, 32510 MiB, 29984 MiB, 2526 MiB 2022/05/10 02:40:13.962, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29968 MiB, 2542 MiB 2022/05/10 02:40:13.962, Tesla V100-SXM2-32GB, 470.57.02, 47 %, 15 %, 32510 MiB, 29844 MiB, 2666 MiB 2022/05/10 02:40:13.963, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29968 MiB, 2542 MiB 2022/05/10 02:40:13.967, Tesla V100-SXM2-32GB, 470.57.02, 47 %, 15 %, 32510 MiB, 29844 MiB, 2666 MiB 2022/05/10 02:40:13.968, Tesla V100-SXM2-32GB, 470.57.02, 47 %, 15 %, 32510 MiB, 29844 MiB, 2666 MiB 2022/05/10 02:40:13.970, Tesla V100-SXM2-32GB, 470.57.02, 15 %, 9 %, 32510 MiB, 29960 MiB, 2550 MiB 2022/05/10 02:40:13.970, Tesla V100-SXM2-32GB, 470.57.02, 4 %, 2 %, 32510 MiB, 29900 MiB, 2610 MiB 2022/05/10 02:40:13.970, Tesla V100-SXM2-32GB, 470.57.02, 31 %, 8 %, 32510 MiB, 29888 MiB, 2622 MiB 2022/05/10 02:40:13.971, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29924 MiB, 2586 MiB 2022/05/10 02:40:13.972, Tesla V100-SXM2-32GB, 470.57.02, 4 %, 2 %, 32510 MiB, 29900 MiB, 2610 MiB 2022/05/10 02:40:13.976, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29924 MiB, 2586 MiB 2022/05/10 02:40:13.977, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29924 MiB, 2586 MiB 2022/05/10 02:40:13.979, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29968 MiB, 2542 MiB 2022/05/10 02:40:13.979, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29844 MiB, 2666 MiB 2022/05/10 02:40:13.980, Tesla V100-SXM2-32GB, 470.57.02, 27 %, 8 %, 32510 MiB, 29908 MiB, 2602 MiB 2022/05/10 02:40:13.980, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29844 MiB, 2666 MiB 2022/05/10 02:40:13.988, Tesla V100-SXM2-32GB, 470.57.02, 4 %, 2 %, 32510 MiB, 29900 MiB, 2610 MiB 2022/05/10 02:40:13.988, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29924 MiB, 2586 MiB 2022/05/10 02:40:13.989, Tesla V100-SXM2-32GB, 470.57.02, 14 %, 3 %, 32510 MiB, 29984 MiB, 2526 MiB 2022/05/10 02:40:13.989, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29924 MiB, 2586 MiB 2022/05/10 02:40:13.996, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29844 MiB, 2666 MiB 2022/05/10 02:40:13.996, Tesla V100-SXM2-32GB, 470.57.02, 15 %, 9 %, 32510 MiB, 29960 MiB, 2550 MiB 2022/05/10 02:40:14.006, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29924 MiB, 2586 MiB 2022/05/10 02:40:14.007, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29968 MiB, 2542 MiB 2022/05/10 02:40:14.015, Tesla V100-SXM2-32GB, 470.57.02, 4 %, 2 %, 32510 MiB, 29900 MiB, 2610 MiB 2022/05/10 02:40:14.028, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29844 MiB, 2666 MiB 2022/05/10 02:40:14.039, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29924 MiB, 2586 MiB [rank:0] iter: 200/1100, loss: 0.4698213338851929, latency(ms): 41.6776216775178909 | 2022-05-10 02:40:17.915 [rank:0] iter: 300/1100, loss: 0.4608387053012848, latency(ms): 39.8735262453556061 | 2022-05-10 02:40:21.902 [rank:0] iter: 400/1100, loss: 0.4522458016872406, latency(ms): 39.9575987458229065 | 2022-05-10 02:40:25.898 [rank:0] iter: 500/1100, loss: 0.4503375589847565, latency(ms): 40.6676477193832397 | 2022-05-10 02:40:29.965 [rank:0] iter: 600/1100, loss: 0.4463795125484467, latency(ms): 41.1789874732494354 | 2022-05-10 02:40:34.083 [rank:0] iter: 700/1100, loss: 0.4401709437370300, latency(ms): 41.9284480810165405 | 2022-05-10 02:40:38.276 [rank:0] iter: 800/1100, loss: 0.4423676729202271, latency(ms): 41.8719954788684845 | 2022-05-10 02:40:42.463 [rank:0] iter: 900/1100, loss: 0.4324282109737396, latency(ms): 42.9501030221581459 | 2022-05-10 02:40:46.758 [rank:0] iter: 1000/1100, loss: 0.4311335086822510, latency(ms): 43.4146095067262650 | 2022-05-10 02:40:51.099 [rank:0] iter: 1100/1100, loss: 0.4326019287109375, latency(ms): 44.0453243255615234 | 2022-05-10 02:40:55.504