eval_loss = 5.804486441558424 perplexity = tensor(331.7847)