model =output_dir/new/step_benchmark_roberta total batch size=16 train num epochs=3 fp16 =False max seq length =80 eval_acc = 0.4882035389383185 eval_loss = 1.420818744946441