loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 ***************************************** Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed. ***************************************** loaded library: loaded library: loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1/usr/lib/x86_64-linux-gnu/libibverbs.so.1/usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1/usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 loaded library: /usr/lib/x86_64-linux-gnu/libibverbs.so.1 ------------------------ arguments ------------------------ batch_size ...................................... 65536 batch_size_per_proc ............................. 8192 data_dir ........................................ /dataset/f9f659c5/wdl_ofrecord data_part_name_suffix_length .................... 5 data_part_num ................................... 256 dataset_format .................................. ofrecord ddp ............................................. False deep_dropout_rate ............................... 0.5 deep_embedding_vec_size ......................... 16 deep_vocab_size ................................. 2322444 eval_after_training ............................. False eval_batchs ..................................... 20 eval_interval ................................... 0 execution_mode .................................. graph hidden_size ..................................... 1024 hidden_units_num ................................ 2 learning_rate ................................... 0.001 loss_print_every_n_iter ......................... 100 max_iter ........................................ 1100 model_load_dir .................................. model_save_dir .................................. ./checkpoint num_deep_sparse_fields .......................... 26 num_dense_fields ................................ 13 num_wide_sparse_fields .......................... 2 save_initial_model .............................. False save_model_after_each_eval ...................... False test_name ....................................... noname_test wide_vocab_size ................................. 2322444 -------------------- end of arguments --------------------- [rank:0] iter: 100/1100, loss: 0.0621693618595600, latency(ms): 186.1100142449140549 | 2022-05-15 01:58:44.319 timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/15 01:58:44.484, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30039 MiB, 2471 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/15 01:58:44.489, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30039 MiB, 2471 MiB 2022/05/15 01:58:44.491, Tesla V100-SXM2-32GB, 470.57.02, 84 %, 28 %, 32510 MiB, 30059 MiB, 2451 MiB 2022/05/15 01:58:44.490, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30039 MiB, 2471 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/15 01:58:44.491, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30039 MiB, 2471 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/15 01:58:44.494, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30039 MiB, 2471 MiB 2022/05/15 01:58:44.497, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30059 MiB, 2451 MiB timestamp, name, driver_version, utilization.gpu [%], utilization.memory [%], memory.total [MiB], memory.free [MiB], memory.used [MiB] 2022/05/15 01:58:44.498, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.499, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30059 MiB, 2451 MiB 2022/05/15 01:58:44.499, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30039 MiB, 2471 MiB 2022/05/15 01:58:44.500, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30059 MiB, 2451 MiB 2022/05/15 01:58:44.501, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30039 MiB, 2471 MiB 2022/05/15 01:58:44.502, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30059 MiB, 2451 MiB 2022/05/15 01:58:44.504, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.505, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30039 MiB, 2471 MiB 2022/05/15 01:58:44.506, Tesla V100-SXM2-32GB, 470.57.02, 44 %, 15 %, 32510 MiB, 30195 MiB, 2315 MiB 2022/05/15 01:58:44.507, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.508, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30059 MiB, 2451 MiB 2022/05/15 01:58:44.509, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.511, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30059 MiB, 2451 MiB 2022/05/15 01:58:44.511, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.514, Tesla V100-SXM2-32GB, 470.57.02, 44 %, 15 %, 32510 MiB, 30195 MiB, 2315 MiB 2022/05/15 01:58:44.516, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30059 MiB, 2451 MiB 2022/05/15 01:58:44.516, Tesla V100-SXM2-32GB, 470.57.02, 52 %, 18 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.517, Tesla V100-SXM2-32GB, 470.57.02, 44 %, 15 %, 32510 MiB, 30195 MiB, 2315 MiB 2022/05/15 01:58:44.518, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.518, Tesla V100-SXM2-32GB, 470.57.02, 44 %, 15 %, 32510 MiB, 30195 MiB, 2315 MiB 2022/05/15 01:58:44.521, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.522, Tesla V100-SXM2-32GB, 470.57.02, 44 %, 15 %, 32510 MiB, 30195 MiB, 2315 MiB 2022/05/15 01:58:44.524, Tesla V100-SXM2-32GB, 470.57.02, 52 %, 18 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.526, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.526, Tesla V100-SXM2-32GB, 470.57.02, 22 %, 6 %, 32510 MiB, 30043 MiB, 2467 MiB 2022/05/15 01:58:44.527, Tesla V100-SXM2-32GB, 470.57.02, 52 %, 18 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.528, Tesla V100-SXM2-32GB, 470.57.02, 44 %, 15 %, 32510 MiB, 30195 MiB, 2315 MiB 2022/05/15 01:58:44.528, Tesla V100-SXM2-32GB, 470.57.02, 52 %, 18 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.531, Tesla V100-SXM2-32GB, 470.57.02, 44 %, 15 %, 32510 MiB, 30195 MiB, 2315 MiB 2022/05/15 01:58:44.531, Tesla V100-SXM2-32GB, 470.57.02, 52 %, 18 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.534, Tesla V100-SXM2-32GB, 470.57.02, 22 %, 6 %, 32510 MiB, 30043 MiB, 2467 MiB 2022/05/15 01:58:44.536, Tesla V100-SXM2-32GB, 470.57.02, 44 %, 15 %, 32510 MiB, 30195 MiB, 2315 MiB 2022/05/15 01:58:44.536, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29931 MiB, 2579 MiB 2022/05/15 01:58:44.537, Tesla V100-SXM2-32GB, 470.57.02, 22 %, 6 %, 32510 MiB, 30043 MiB, 2467 MiB 2022/05/15 01:58:44.538, Tesla V100-SXM2-32GB, 470.57.02, 52 %, 18 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.538, Tesla V100-SXM2-32GB, 470.57.02, 22 %, 6 %, 32510 MiB, 30043 MiB, 2467 MiB 2022/05/15 01:58:44.541, Tesla V100-SXM2-32GB, 470.57.02, 52 %, 18 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.541, Tesla V100-SXM2-32GB, 470.57.02, 22 %, 6 %, 32510 MiB, 30043 MiB, 2467 MiB 2022/05/15 01:58:44.544, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29931 MiB, 2579 MiB 2022/05/15 01:58:44.546, Tesla V100-SXM2-32GB, 470.57.02, 52 %, 18 %, 32510 MiB, 30211 MiB, 2299 MiB 2022/05/15 01:58:44.546, Tesla V100-SXM2-32GB, 470.57.02, 34 %, 11 %, 32510 MiB, 30123 MiB, 2387 MiB 2022/05/15 01:58:44.547, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29931 MiB, 2579 MiB 2022/05/15 01:58:44.548, Tesla V100-SXM2-32GB, 470.57.02, 22 %, 6 %, 32510 MiB, 30043 MiB, 2467 MiB 2022/05/15 01:58:44.548, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29931 MiB, 2579 MiB 2022/05/15 01:58:44.551, Tesla V100-SXM2-32GB, 470.57.02, 22 %, 6 %, 32510 MiB, 30043 MiB, 2467 MiB 2022/05/15 01:58:44.552, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29931 MiB, 2579 MiB 2022/05/15 01:58:44.554, Tesla V100-SXM2-32GB, 470.57.02, 34 %, 11 %, 32510 MiB, 30123 MiB, 2387 MiB 2022/05/15 01:58:44.556, Tesla V100-SXM2-32GB, 470.57.02, 22 %, 6 %, 32510 MiB, 30043 MiB, 2467 MiB 2022/05/15 01:58:44.557, Tesla V100-SXM2-32GB, 470.57.02, 34 %, 11 %, 32510 MiB, 30123 MiB, 2387 MiB 2022/05/15 01:58:44.558, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29931 MiB, 2579 MiB 2022/05/15 01:58:44.559, Tesla V100-SXM2-32GB, 470.57.02, 34 %, 11 %, 32510 MiB, 30123 MiB, 2387 MiB 2022/05/15 01:58:44.562, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29931 MiB, 2579 MiB 2022/05/15 01:58:44.562, Tesla V100-SXM2-32GB, 470.57.02, 34 %, 11 %, 32510 MiB, 30123 MiB, 2387 MiB 2022/05/15 01:58:44.566, Tesla V100-SXM2-32GB, 470.57.02, 0 %, 0 %, 32510 MiB, 29931 MiB, 2579 MiB 2022/05/15 01:58:44.568, Tesla V100-SXM2-32GB, 470.57.02, 34 %, 11 %, 32510 MiB, 30123 MiB, 2387 MiB 2022/05/15 01:58:44.571, Tesla V100-SXM2-32GB, 470.57.02, 34 %, 11 %, 32510 MiB, 30123 MiB, 2387 MiB 2022/05/15 01:58:44.575, Tesla V100-SXM2-32GB, 470.57.02, 34 %, 11 %, 32510 MiB, 30123 MiB, 2387 MiB [rank:0] iter: 200/1100, loss: 0.0585128739476204, latency(ms): 14.8708538338541985 | 2022-05-15 01:58:45.806 [rank:0] iter: 300/1100, loss: 0.0577624365687370, latency(ms): 11.8026014044880867 | 2022-05-15 01:58:46.987 [rank:0] iter: 400/1100, loss: 0.0573879443109035, latency(ms): 11.9052816182374954 | 2022-05-15 01:58:48.177 [rank:0] iter: 500/1100, loss: 0.0571240074932575, latency(ms): 12.0105894654989243 | 2022-05-15 01:58:49.378 [rank:0] iter: 600/1100, loss: 0.0565957911312580, latency(ms): 11.9691264629364014 | 2022-05-15 01:58:50.575 [rank:0] iter: 700/1100, loss: 0.0558825358748436, latency(ms): 11.5400382876396179 | 2022-05-15 01:58:51.729 [rank:0] iter: 800/1100, loss: 0.0558075606822968, latency(ms): 11.8978261947631836 | 2022-05-15 01:58:52.919 [rank:0] iter: 900/1100, loss: 0.0557142049074173, latency(ms): 11.8812283128499985 | 2022-05-15 01:58:54.107 [rank:0] iter: 1000/1100, loss: 0.0555174350738525, latency(ms): 11.8253543600440025 | 2022-05-15 01:58:55.289 [rank:0] iter: 1100/1100, loss: 0.0557172931730747, latency(ms): 11.6677984595298767 | 2022-05-15 01:58:56.456