Upload README.md with huggingface_hub
Browse files
README.md
CHANGED
|
@@ -31,7 +31,7 @@ z-lab/Llama-3.1-8B-Instruct-PARO is a 4-bit [meta-llama/Llama-3.1-8B-Instruct](h
|
|
| 31 |
pip install "paroquant[vllm]"
|
| 32 |
|
| 33 |
# NVIDIA GPU (CUDA 13.0)
|
| 34 |
-pip install "paroquant[vllm] vllm==0.17.1" \
|
| 35 |
--extra-index-url https://wheels.vllm.ai/0.17.1/cu130 \
|
| 36 |
--extra-index-url https://download.pytorch.org/whl/cu130
|
| 37 |
|
|
|
|
| 31 |
pip install "paroquant[vllm]"
|
| 32 |
|
| 33 |
# NVIDIA GPU (CUDA 13.0)
|
| 34 |
+pip install "paroquant[vllm]" "vllm==0.17.1" \
|
| 35 |
--extra-index-url https://wheels.vllm.ai/0.17.1/cu130 \
|
| 36 |
--extra-index-url https://download.pytorch.org/whl/cu130
|
| 37 |
|