eval_loss = 4.131179701794618 perplexity = tensor(62.2513)