model =output_dir/new/order_benchmark_roberta total batch size=16 train num epochs=3 fp16 =False max seq length =80 eval_acc = 0.17775948788294468 eval_loss = 2.3591820047612777