correct = 4982 eval_loss = -6.908095015576605 incorrect = 1081 similar = 4507