eval_loss = 2.1579703759142412 perplexity = tensor(8.6536)