eval_loss = 0.6492512822151184 f1_score = 0.6030478301397648 f1_score_strict = 0.6219198790627363 precision = 0.5892312973009175 precision_strict = 0.6708298465373937 recall = 0.6194796608896835 recall_strict = 0.5840556028758207