correct = 3472 eval_loss = -12.407477678571428 incorrect = 361 similar = 8120