eval_loss = 2.8937215335580833 perplexity = tensor(18.0604)