eval_loss = 2.8732976900107823 perplexity = tensor(17.6953)