xFasterTransformer
xFasterTransformer copied to clipboard
chatglm3 6b error
bash ./run_benchmark.sh -m chatglm3-6b -d nf4 -s 1 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d int4 -s 1 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d bf16_nf4 -s 1 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d bf16_int4 -s 1 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d w8a8_nf4 -s 1 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d w8a8_int4 -s 1 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d bf16 -s 2 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d int8 -s 2 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d nf4 -s 2 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d bf16_fp16 -s 2 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d bf16_w8a8 -s 2 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d bf16_int8 -s 2 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d bf16_int4 -s 2 -bs 1 -in 256 -out 256 -i 1
bash ./run_benchmark.sh -m chatglm3-6b -d bf16_nf4 -s 2 -bs 1 -in 256 -out 256 -i 1