#!/bin/bash
#
# Launch inference_mathglm.py in inference mode with a fixed model shape and
# fixed sampling settings.
#
# Usage: <this script> [extra inference_mathglm.py arguments...]
#
# Every argument given to this script is appended, unchanged, to the end of
# the python command line, after the options listed below.
#
# Exit status: that of the python process.

set -euo pipefail

# Optional model directory override, left disabled:
# SAT_HOME=/raid/dm/sat_models

# Model shape. These feed --num-layers, --hidden-size,
# --num-attention-heads and --model-parallel-size respectively.
NLAYERS=48
NHIDDEN=2560
NATT=40
MPSIZE=1

# NOTE(review): MAXSEQLEN is not referenced anywhere below; the command passes
# a literal `--max-sequence-length 512`. Confirm which value is intended
# before wiring this variable in.
# shellcheck disable=SC2034
MAXSEQLEN=1089

# Sampling arguments (fed to --temperature and --top_k).
# TEMP=1.03
TEMP=0.1
TOPK=200

# Restrict the python process to CUDA device index 7.
export CUDA_VISIBLE_DEVICES=7

# Disabled: pass SAT_HOME through to the python process by prefixing the
# command with
#   SAT_HOME=$SAT_HOME \
#
# All expansions are quoted so values are passed as single words, and "$@"
# forwards caller arguments verbatim (no re-splitting or glob expansion).
python inference_mathglm.py \
  --mode inference \
  --distributed-backend nccl \
  --max-sequence-length 512 \
  --fp16 \
  --model-parallel-size "$MPSIZE" \
  --num-layers "$NLAYERS" \
  --hidden-size "$NHIDDEN" \
  --num-attention-heads "$NATT" \
  --temperature "$TEMP" \
  --top_k "$TOPK" \
  --input-source ./input_test.txt \
  --output-path samples_result \
  --batch-size 1 \
  --max-inference-batch-size 8 \
  "$@"