00000068
# Create and enter an isolated Python 3.10 conda environment named "myenv",
# then run the local installwhl.sh helper against /home/whl310.
# --yes keeps `conda create` from blocking on its confirmation prompt.
conda create --yes --name myenv python=3.10
# `conda activate` is a shell function that only exists after conda's shell
# hook has been loaded. Load it explicitly so activation also works in a
# non-interactive shell (harmless if `conda init` has already set it up).
eval "$(conda shell.bash hook)"
conda activate myenv
# NOTE(review): installwhl.sh is not shown here; presumably it installs the
# wheel files found in the directory given as its argument -- confirm.
bash installwhl.sh /home/whl310
# Fetch the Meta-Llama-3-8B-Instruct GPTQ-Int8 checkpoint from ModelScope and
# run offline_inference.py on it with GPTQ quantization.
llama_dir=/home/Meta-Llama-3-8B-Instruct-GPTQ-Int8

# -y: do not block on apt's confirmation prompt.
apt-get install -y git-lfs
# Register the LFS filters with git; without them a clone can leave small
# pointer files in place of the real weight files. Safe to run repeatedly.
git lfs install

# Clone straight into the directory that --model points at instead of relying
# on the current working directory being /home. Skip the clone when a checkout
# is already present so the commands can be re-run.
if [ ! -d "${llama_dir}/.git" ]; then
  git clone https://www.modelscope.cn/swift/Meta-Llama-3-8B-Instruct-GPTQ-Int8.git "${llama_dir}"
fi

# NOTE(review): offline_inference.py is not shown here; -tp and --temperature
# are passed through unchanged -- confirm their meaning against that script.
python3 offline_inference.py --model "${llama_dir}" --quantization gptq -tp 1 --temperature 0.0
# Install the corex-tagged vLLM and ixformer wheels from the current
# directory, one pip invocation per wheel, vLLM first.
# The ixformer wheel carries the cp310 tag, i.e. it targets CPython 3.10.
for wheel_file in \
  vllm-0.5.4+corex.4.1.0.w2436-py3-none-any.whl \
  ixformer-0.6.0+corex.4.1.0.w2436-cp310-cp310-linux_x86_64.whl
do
  pip3 install "${wheel_file}"
done
# Ran the model again; the output is no longer garbled.
# Fetch the chatglm3-6B GPTQ 4-bit checkpoint from hf-mirror.com and run
# offline_inference.py on it with GPTQ quantization.
chatglm_dir=/home/chatglm3-6B-gptq-4bit

# Clone straight into the directory that --model points at instead of relying
# on the current working directory being /home. Skip the clone when a checkout
# is already present so the commands can be re-run.
if [ ! -d "${chatglm_dir}/.git" ]; then
  git clone https://hf-mirror.com/ranchlai/chatglm3-6B-gptq-4bit "${chatglm_dir}"
fi

# --trust-remote-code is passed in addition to the flags used for the Llama
# run. NOTE(review): presumably this lets the Python code shipped inside the
# model repository execute -- only use it with a repository you trust.
python3 offline_inference.py --model "${chatglm_dir}" --quantization gptq -tp 1 --temperature 0.0 --trust-remote-code