model =output_dir/new/goal_benchmark_roberta total batch size=8 train num epochs=3 fp16 =True max seq length =256 eval_acc = 0.7081148848871667 eval_loss = 0.5807009809192992