eval_loss = 2.243838704103647 perplexity = tensor(9.4295)