eval_loss = 4.1149924498684 perplexity = tensor(61.2518)