#!/bin/bash
# Launches inference_mathglm.py in inference mode with fixed model-shape and
# sampling settings. Any arguments given to this script are appended to the
# python command line unchanged.
#
# Usage: <this script> [extra inference_mathglm.py arguments...]

# SAT_HOME=/raid/dm/sat_models

# Model-shape settings forwarded to the python script below.
NLAYERS=48     # passed as --num-layers
NHIDDEN=2560   # passed as --hidden-size
NATT=40        # passed as --num-attention-heads
# NOTE(review): MAXSEQLEN is assigned but never referenced; the command below
# passes a literal 512 to --max-sequence-length. Confirm which value is intended.
MAXSEQLEN=1089
MPSIZE=1       # passed as --model-parallel-size

# Sampling settings.
# TEMP=1.03    (alternative value, currently disabled)
TEMP=0.1       # passed as --temperature
TOPK=200       # passed as --top_k

# Exported so the python process inherits it (the value selects device index 7).
export CUDA_VISIBLE_DEVICES=7

# To set SAT_HOME for the run, prefix the python command with: SAT_HOME=$SAT_HOME
# Expansions are quoted so values are never re-split or glob-expanded, and
# "$@" keeps every forwarded argument as a single word.
python inference_mathglm.py \
  --mode inference \
  --distributed-backend nccl \
  --max-sequence-length 512 \
  --fp16 \
  --model-parallel-size "$MPSIZE" \
  --num-layers "$NLAYERS" \
  --hidden-size "$NHIDDEN" \
  --num-attention-heads "$NATT" \
  --temperature "$TEMP" \
  --top_k "$TOPK" \
  --input-source ./input_test.txt \
  --output-path samples_result \
  --batch-size 1 \
  --max-inference-batch-size 8 \
  "$@"