eval_loss = 1.9889091809034902 perplexity = tensor(7.3076)