TrainOutput(global_step=21, training_loss=0.4915756980578105, metrics={'train_runtime': 192.3639, 'train_samples_per_second': 0.437, 'train_steps_per_second': 0.109, 'total_flos': 666298165708800.0, 'train_loss': 0.4915756980578105, 'epoch': 0.01})