00000081
bash corex-docker-installer-4.1.2-10.2-ubuntu20.04-py3.10-x86_64.run
docker run -d --shm-size="32g" -it -v /usr/src:/usr/src -v /lib/modules:/lib/modules -v /dev:/dev -v /home:/home --name=test --privileged --cap-add=ALL --pid=host corex:4.1.2
docker exec -it test /bin/bash
cd /home
bash llm-inference-benchmark-corex-4.1.2.run
下载并解压数据集（在 /home 目录下将以下链接的文件保存为 data.zip）：
https://huggingface.co/datasets/THUDM/LongBench/resolve/main/data.zip
cp data.zip /home/llm-inference-benchmark/text-generation-inference
unzip data.zip
apt-get install git-lfs curl
git clone https://hf-mirror.com/THUDM/glm-4-9b
cd /home/llm-inference-benchmark/vllm/glm
bash test_glm.sh --num-prompts 1 --input-tokens 512 --output-tokens 512 --repeat-time 3 --model /home/glm-4-9b -tp 1 --max-num-seqs 1 --max-num-batched-tokens 20000 --max-model-len 2048 --trust-remote-code --distributed-executor-backend ray