eval_loss = 0.20749381397451674 f1_score = 0.6845588961701847 precision = 0.6727508090614887 recall = 0.6967888985720989