Update README.md
Browse files
README.md
CHANGED
|
@@ -87,6 +87,7 @@ vllm serve inclusionAI/Ring-mini-linear-2.0-GPTQ-int4 \
|
|
| 87 |
--gpu-memory-utilization 0.90 \
|
| 88 |
--max-num-seqs 128 \
|
| 89 |
--no-enable-prefix-caching
|
|
|
|
| 90 |
```
|
| 91 |
|
| 92 |
|
|
|
|
| 87 |
--gpu-memory-utilization 0.90 \
|
| 88 |
--max-num-seqs 128 \
|
| 89 |
--no-enable-prefix-caching \
|
| 90 |
+
--api-key your-api-key
|
| 91 |
```
|
| 92 |
|
| 93 |
|