eval_loss = 3.159255956494531 perplexity = tensor(23.5531)