Skip to content

Commit 21cfc20

Browse files
committed
Update models.yaml
1 parent 73f7883 commit 21cfc20

File tree

1 file changed

+2
-17
lines changed

1 file changed

+2
-17
lines changed

vec_inf/config/models.yaml

Lines changed: 2 additions & 17 deletions
Original file line number | Diff line number | Diff line change
@@ -1,19 +1,4 @@
1 1
models:
2-
c4ai-command-r-plus:
3-
model_family: c4ai-command-r
4-
model_variant: plus
5-
model_type: LLM
6-
gpus_per_node: 4
7-
num_nodes: 2
8-
vocab_size: 256000
9-
qos: m2
10-
time: 08:00:00
11-
partition: a40
12-
vllm_args:
13-
--pipeline-parallel-size: 2
14-
--tensor-parallel-size: 4
15-
--max-model-len: 8192
16-
--max-num-seqs: 256
17 2
c4ai-command-r-plus-08-2024:
18 3
model_family: c4ai-command-r
19 4
model_variant: plus-08-2024
@@ -989,9 +974,9 @@ models:
989 974
--max-model-len: 4096
990 975
--max-num-seqs: 256
991 976
--compilation-config: 3
992-
QwQ-32B-Preview:
977+
QwQ-32B:
993 978
model_family: QwQ
994-
model_variant: 32B-Preview
979+
model_variant: 32B
995 980
model_type: LLM
996 981
gpus_per_node: 2
997 982
num_nodes: 1

0 commit comments

Comments
 (0)