eval_loss = 39.723388671875 perplexity = tensor(1.7850e+17)