af631bd c73918c af631bd c73918c
1
2
3
4
5
6
7
8
model =gpt2 total batch size=40 train num epochs=3 fp16 =True max seq length =40 eval_acc = 0.7935483870967742 eval_loss = 0.5006362595865803