#!/usr/bin/env bash
# Launch inference_mathglm.py in inference mode.
#
# Usage: bash <this script> [extra inference_mathglm.py arguments...]
# Any arguments given to this script are appended, unchanged, to the end of
# the python command line below.

# SAT_HOME=/raid/dm/sat_models

# Values forwarded to --num-layers, --hidden-size and --num-attention-heads.
NLAYERS=48
NHIDDEN=2560
NATT=40
# NOTE(review): MAXSEQLEN is never referenced; the command below passes a
# literal 512 to --max-sequence-length. Confirm which value is intended.
# shellcheck disable=SC2034
MAXSEQLEN=1089
# Forwarded to --model-parallel-size.
MPSIZE=1

# Sampling args (forwarded to --temperature and --top_k).
# TEMP=1.03
TEMP=0.1
TOPK=200

# Expose only GPU index 7 to the python process.
export CUDA_VISIBLE_DEVICES=7

# SAT_HOME=$SAT_HOME \
python inference_mathglm.py \
  --mode inference \
  --distributed-backend nccl \
  --max-sequence-length 512 \
  --fp16 \
  --model-parallel-size "$MPSIZE" \
  --num-layers "$NLAYERS" \
  --hidden-size "$NHIDDEN" \
  --num-attention-heads "$NATT" \
  --temperature "$TEMP" \
  --top_k "$TOPK" \
  --input-source ./input_test.txt \
  --output-path samples_result \
  --batch-size 1 \
  --max-inference-batch-size 8 \
  "$@"