before_init_mem_cpu = 1314717696 before_init_mem_gpu = 0 epoch = 6.0 init_mem_cpu_alloc_delta = 880553984 init_mem_cpu_peaked_delta = 93917184 init_mem_gpu_alloc_delta = 443396608 init_mem_gpu_peaked_delta = 0 train_loss = 0.8106447110522921 train_mem_cpu_alloc_delta = 31978672128 train_mem_cpu_peaked_delta = 500772864 train_mem_gpu_alloc_delta = 1348273664 train_mem_gpu_peaked_delta = 64082841600 train_runtime = 71211.051 train_samples_per_second = 1017.691 train_steps_per_second = 1.325