We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 07a4973 commit 75e0ae1 Copy full SHA for 75e0ae1
vec_inf/client/_client_vars.py
@@ -78,7 +78,12 @@
78
VLLM_SHORT_TO_LONG_MAP = {
79
"-tp": "--tensor-parallel-size",
80
"-pp": "--pipeline-parallel-size",
81
+ "-dp": "--data-parallel-size",
82
+ "-dpl": "--data-parallel-size-local",
83
+ "-dpa": "--data-parallel-address",
84
+ "-dpp": "--data-parallel-rpc-port",
85
"-O": "--compilation-config",
86
+ "-q": "--quantization",
87
}
88
89
@@ -214,7 +219,7 @@ class SlurmScriptTemplate(TypedDict):
214
219
' && mv temp.json "$json_path"',
215
220
],
216
221
"launch_cmd": [
217
- "python3.10 -m vllm.entrypoints.openai.api_server \\",
222
+ "vllm serve \\",
218
223
" --model {model_weights_path} \\",
224
" --served-model-name {model_name} \\",
225
' --host "0.0.0.0" \\',
0 commit comments