mirror of https://github.com/THUDM/CodeGeeX.git
You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
48 lines
1.2 KiB
Bash
48 lines
1.2 KiB
Bash
# This script is used to test the inference of CodeGeeX.
#
# Arguments:
#   $1 - MP_SIZE: number of processes handed to torchrun, also used as the
#        tensor-model-parallel size (optional, defaults to 1)
#   $2 - PROMPT_FILE: path of the prompt file (optional; when empty a default
#        under the repository's tests/ directory is used)

MP_SIZE="${1:-1}"
PROMPT_FILE="${2-}"

# MP_SIZE is compared numerically and passed to torchrun, so reject anything
# that is not a plain non-negative integer instead of failing later with an
# obscure "integer expression expected" message.
if [[ ! "$MP_SIZE" =~ ^[0-9]+$ ]]; then
  echo "MP_SIZE must be a non-negative integer, got: $MP_SIZE" >&2
  echo "Usage: ${0##*/} [MP_SIZE] [PROMPT_FILE]" >&2
  exit 1
fi

# Resolve every path relative to the location of this script, so the script
# can be started from any working directory.
SCRIPT_PATH=$(realpath "$0")
SCRIPT_DIR=$(dirname "$SCRIPT_PATH")
MAIN_DIR=$(dirname "$SCRIPT_DIR")
TOKENIZER_PATH="$MAIN_DIR/codegeex/tokenizer/"

# Pick the model configuration: the single-process config when MP_SIZE is 1,
# the model-parallel config otherwise.
if [ "$MP_SIZE" -eq 1 ]; then
  CONFIG_FILE="$MAIN_DIR/configs/codegeex_13b.sh"
else
  CONFIG_FILE="$MAIN_DIR/configs/codegeex_13b_parallel.sh"
fi

# Stop early when the config is missing; launching without it would only
# fail later inside torchrun with a much less helpful message.
if [ ! -r "$CONFIG_FILE" ]; then
  echo "Config file not found or not readable: $CONFIG_FILE" >&2
  exit 1
fi

# The config is sourced (not executed) so that the variables it defines --
# presumably MODEL_ARGS, which the launch command expands -- are set in this
# shell.
# shellcheck source=/dev/null
source "$CONFIG_FILE"
echo "Load config from $CONFIG_FILE"

# export CUDA settings
# A CUDA_HOME already set by the caller is respected; the CUDA 11.1 location
# is only used as a fallback when the variable is unset or empty.
export CUDA_HOME="${CUDA_HOME:-/usr/local/cuda-11.1/}"
# export CUDA_VISIBLE_DEVICES=0,1

# Fall back to the test prompt under tests/ when no prompt file was given.
if [ -z "$PROMPT_FILE" ]; then
  PROMPT_FILE="$MAIN_DIR/tests/test_prompt.txt"
fi

# The launch command is assembled as an array rather than a string passed to
# eval, so PROMPT_FILE (taken from the command line) and the paths derived
# from the script location reach torchrun as single, unmodified arguments
# even when they contain spaces or shell metacharacters.
#
# MODEL_ARGS is a flat option string (not defined in this file; presumably
# set by the sourced config). It is still parsed with shell quoting rules,
# as the former eval-based invocation did, so quoted values inside it keep
# working. Only this config-provided string goes through eval.
declare -a model_args=()
eval "model_args=(${MODEL_ARGS-})"

# remove --greedy if using sampling
cmd=(
  torchrun --nproc_per_node "$MP_SIZE" "$MAIN_DIR/tests/test_inference_megatron.py"
  --tensor-model-parallel-size "$MP_SIZE"
  --prompt-file "$PROMPT_FILE"
  --tokenizer-path "$TOKENIZER_PATH"
  --micro-batch-size 1
  --out-seq-length 1024
  --temperature 0.8
  --top-p 0.95
  --top-k 0
  --greedy
  --use-cpu-initialization
  --ln-fp16
  "${model_args[@]}"
)

# Log the command in shell-quoted form, then run it; the exit status of the
# script is the exit status of torchrun.
printf '%q ' "${cmd[@]}"
printf '\n'
"${cmd[@]}"