eval_loss = 1.1680530061261 perplexity = tensor(3.2157)