eval_loss = 1.8874700883779576 perplexity = tensor(6.6026)