eval_loss = 1.3889511987951484 perplexity = tensor(4.0106)