eval_loss = 4.334688968825758 perplexity = tensor(76.3012)