eval_loss = 1.283639632165432 perplexity = tensor(3.6098)