|
1 | | -model_name,model_family,model_variant,model_type,partition,qos,time,num_gpus,num_nodes,vocab_size,max_model_len,data_type,venv,log_dir,pipeline_parallelism |
2 | | -c4ai-command-r-plus,c4ai-command-r,plus,LLM,a40,m2,08:00:00,4,2,256000,8192,auto,singularity,default,true |
3 | | -c4ai-command-r-plus-08-2024,c4ai-command-r,plus-08-2024,LLM,a40,m2,08:00:00,4,2,256000,65536,auto,singularity,default,true |
4 | | -c4ai-command-r-08-2024,c4ai-command-r,08-2024,LLM,a40,m2,08:00:00,2,1,256000,32768,auto,singularity,default,true |
5 | | -CodeLlama-7b-hf,CodeLlama,7b-hf,LLM,a40,m2,08:00:00,1,1,32000,16384,auto,singularity,default,true |
6 | | -CodeLlama-7b-Instruct-hf,CodeLlama,7b-Instruct-hf,LLM,a40,m2,08:00:00,1,1,32000,16384,auto,singularity,default,true |
7 | | -CodeLlama-13b-hf,CodeLlama,13b-hf,LLM,a40,m2,08:00:00,1,1,32000,16384,auto,singularity,default,true |
8 | | -CodeLlama-13b-Instruct-hf,CodeLlama,13b-Instruct-hf,LLM,a40,m2,08:00:00,1,1,32000,16384,auto,singularity,default,true |
9 | | -CodeLlama-34b-hf,CodeLlama,34b-hf,LLM,a40,m2,08:00:00,2,1,32000,16384,auto,singularity,default,true |
10 | | -CodeLlama-34b-Instruct-hf,CodeLlama,34b-Instruct-hf,LLM,a40,m2,08:00:00,2,1,32000,16384,auto,singularity,default,true |
11 | | -CodeLlama-70b-hf,CodeLlama,70b-hf,LLM,a40,m2,08:00:00,4,1,32000,4096,auto,singularity,default,true |
12 | | -CodeLlama-70b-Instruct-hf,CodeLlama,70b-Instruct-hf,LLM,a40,m2,08:00:00,4,1,32000,4096,auto,singularity,default,true |
13 | | -dbrx-instruct,dbrx,instruct,LLM,a40,m2,08:00:00,4,2,100352,32000,auto,singularity,default,true |
14 | | -gemma-2-9b,gemma-2,9b,LLM,a40,m2,08:00:00,1,1,256000,4096,auto,singularity,default,true |
15 | | -gemma-2-9b-it,gemma-2,9b-it,LLM,a40,m2,08:00:00,1,1,256000,4096,auto,singularity,default,true |
16 | | -gemma-2-27b,gemma-2,27b,LLM,a40,m2,08:00:00,2,1,256000,4096,auto,singularity,default,true |
17 | | -gemma-2-27b-it,gemma-2,27b-it,LLM,a40,m2,08:00:00,2,1,256000,4096,auto,singularity,default,true |
18 | | -Llama-2-7b-hf,Llama-2,7b-hf,LLM,a40,m2,08:00:00,1,1,32000,4096,auto,singularity,default,true |
19 | | -Llama-2-7b-chat-hf,Llama-2,7b-chat-hf,LLM,a40,m2,08:00:00,1,1,32000,4096,auto,singularity,default,true |
20 | | -Llama-2-13b-hf,Llama-2,13b-hf,LLM,a40,m2,08:00:00,1,1,32000,4096,auto,singularity,default,true |
21 | | -Llama-2-13b-chat-hf,Llama-2,13b-chat-hf,LLM,a40,m2,08:00:00,1,1,32000,4096,auto,singularity,default,true |
22 | | -Llama-2-70b-hf,Llama-2,70b-hf,LLM,a40,m2,08:00:00,4,1,32000,4096,auto,singularity,default,true |
23 | | -Llama-2-70b-chat-hf,Llama-2,70b-chat-hf,LLM,a40,m2,08:00:00,4,1,32000,4096,auto,singularity,default,true |
24 | | -llava-1.5-7b-hf,llava-1.5,7b-hf,VLM,a40,m2,08:00:00,1,1,32000,4096,auto,singularity,default,true |
25 | | -llava-1.5-13b-hf,llava-1.5,13b-hf,VLM,a40,m2,08:00:00,1,1,32000,4096,auto,singularity,default,true |
26 | | -llava-v1.6-mistral-7b-hf,llava-v1.6,mistral-7b-hf,VLM,a40,m2,08:00:00,1,1,32064,32768,auto,singularity,default,true |
27 | | -llava-v1.6-34b-hf,llava-v1.6,34b-hf,VLM,a40,m2,08:00:00,2,1,64064,4096,auto,singularity,default,true |
28 | | -Meta-Llama-3-8B,Meta-Llama-3,8B,LLM,a40,m2,08:00:00,1,1,128256,8192,auto,singularity,default,true |
29 | | -Meta-Llama-3-8B-Instruct,Meta-Llama-3,8B-Instruct,LLM,a40,m2,08:00:00,1,1,128256,8192,auto,singularity,default,true |
30 | | -Meta-Llama-3-70B,Meta-Llama-3,70B,LLM,a40,m2,08:00:00,4,1,128256,8192,auto,singularity,default,true |
31 | | -Meta-Llama-3-70B-Instruct,Meta-Llama-3,70B-Instruct,LLM,a40,m2,08:00:00,4,1,128256,8192,auto,singularity,default,true |
32 | | -Meta-Llama-3.1-8B,Meta-Llama-3.1,8B,LLM,a40,m2,08:00:00,1,1,128256,131072,auto,singularity,default,true |
33 | | -Meta-Llama-3.1-8B-Instruct,Meta-Llama-3.1,8B-Instruct,LLM,a40,m2,08:00:00,1,1,128256,131072,auto,singularity,default,true |
34 | | -Meta-Llama-3.1-70B,Meta-Llama-3.1,70B,LLM,a40,m2,08:00:00,4,1,128256,65536,auto,singularity,default,true |
35 | | -Meta-Llama-3.1-70B-Instruct,Meta-Llama-3.1,70B-Instruct,LLM,a40,m2,08:00:00,4,1,128256,65536,auto,singularity,default,true |
36 | | -Meta-Llama-3.1-405B-Instruct,Meta-Llama-3.1,405B-Instruct,LLM,a40,m4,02:00:00,4,8,128256,16384,auto,singularity,default,true |
37 | | -Mistral-7B-v0.1,Mistral,7B-v0.1,LLM,a40,m2,08:00:00,1,1,32000,32768,auto,singularity,default,true |
38 | | -Mistral-7B-Instruct-v0.1,Mistral,7B-Instruct-v0.1,LLM,a40,m2,08:00:00,1,1,32000,32768,auto,singularity,default,true |
39 | | -Mistral-7B-Instruct-v0.2,Mistral,7B-Instruct-v0.2,LLM,a40,m2,08:00:00,1,1,32000,32768,auto,singularity,default,true |
40 | | -Mistral-7B-v0.3,Mistral,7B-v0.3,LLM,a40,m2,08:00:00,1,1,32768,32768,auto,singularity,default,true |
41 | | -Mistral-7B-Instruct-v0.3,Mistral,7B-Instruct-v0.3,LLM,a40,m2,08:00:00,1,1,32768,32768,auto,singularity,default,true |
42 | | -Mistral-Large-Instruct-2407,Mistral,Large-Instruct-2407,LLM,a40,m2,08:00:00,4,2,32768,32768,auto,singularity,default,true |
43 | | -Mixtral-8x7B-Instruct-v0.1,Mixtral,8x7B-Instruct-v0.1,LLM,a40,m2,08:00:00,4,1,32000,32768,auto,singularity,default,true |
44 | | -Mixtral-8x22B-v0.1,Mixtral,8x22B-v0.1,LLM,a40,m2,08:00:00,4,2,32768,65536,auto,singularity,default,true |
45 | | -Mixtral-8x22B-Instruct-v0.1,Mixtral,8x22B-Instruct-v0.1,LLM,a40,m2,08:00:00,4,2,32768,65536,auto,singularity,default,true |
46 | | -Phi-3-medium-128k-instruct,Phi-3,medium-128k-instruct,LLM,a40,m2,08:00:00,2,1,32064,131072,auto,singularity,default,true |
47 | | -Phi-3-vision-128k-instruct,Phi-3,vision-128k-instruct,VLM,a40,m2,08:00:00,2,1,32064,65536,auto,singularity,default,true |
48 | | -Llama3-OpenBioLLM-70B,Llama3-OpenBioLLM,70B,LLM,a40,m2,08:00:00,4,1,128256,8192,auto,singularity,default,true |
49 | | -Llama-3.1-Nemotron-70B-Instruct-HF,Llama-3.1-Nemotron,70B-Instruct-HF,LLM,a40,m2,08:00:00,4,1,128256,65536,auto,singularity,default,true |
50 | | -Llama-3.2-1B,Llama-3.2,1B,LLM,a40,m2,08:00:00,1,1,128256,131072,auto,singularity,default,true |
51 | | -Llama-3.2-1B-Instruct,Llama-3.2,1B-Instruct,LLM,a40,m2,08:00:00,1,1,128256,131072,auto,singularity,default,true |
52 | | -Llama-3.2-3B,Llama-3.2,3B,LLM,a40,m2,08:00:00,1,1,128256,131072,auto,singularity,default,true |
53 | | -Llama-3.2-3B-Instruct,Llama-3.2,3B-Instruct,LLM,a40,m2,08:00:00,1,1,128256,131072,auto,singularity,default,true |
54 | | -Llama-3.2-11B-Vision,Llama-3.2,11B-Vision,VLM,a40,m2,08:00:00,1,1,128256,32768,auto,singularity,default,true |
55 | | -Llama-3.2-11B-Vision-Instruct,Llama-3.2,11B-Vision-Instruct,VLM,a40,m2,08:00:00,1,1,128256,32768,auto,singularity,default,true |
56 | | -Llama-3.2-90B-Vision,Llama-3.2,90B-Vision,VLM,a40,m2,08:00:00,4,2,128256,8192,auto,singularity,default,true |
57 | | -Llama-3.2-90B-Vision-Instruct,Llama-3.2,90B-Vision-Instruct,VLM,a40,m2,08:00:00,4,2,128256,8192,auto,singularity,default,true |
58 | | -Qwen2.5-0.5B-Instruct,Qwen2.5,0.5B-Instruct,LLM,a40,m2,08:00:00,1,1,152064,32768,auto,singularity,default,true |
59 | | -Qwen2.5-1.5B-Instruct,Qwen2.5,1.5B-Instruct,LLM,a40,m2,08:00:00,1,1,152064,32768,auto,singularity,default,true |
60 | | -Qwen2.5-3B-Instruct,Qwen2.5,3B-Instruct,LLM,a40,m2,08:00:00,1,1,152064,32768,auto,singularity,default,true |
61 | | -Qwen2.5-7B-Instruct,Qwen2.5,7B-Instruct,LLM,a40,m2,08:00:00,1,1,152064,32768,auto,singularity,default,true |
62 | | -Qwen2.5-14B-Instruct,Qwen2.5,14B-Instruct,LLM,a40,m2,08:00:00,1,1,152064,32768,auto,singularity,default,true |
63 | | -Qwen2.5-32B-Instruct,Qwen2.5,32B-Instruct,LLM,a40,m2,08:00:00,2,1,152064,32768,auto,singularity,default,true |
64 | | -Qwen2.5-72B-Instruct,Qwen2.5,72B-Instruct,LLM,a40,m2,08:00:00,4,1,152064,32768,auto,singularity,default,true |
65 | | -Pixtral-12B-2409,Pixtral,12B-2409,VLM,a40,m2,08:00:00,1,1,131072,16384,auto,singularity,default,true |
66 | | -bge-multilingual-gemma2,bge,multilingual-gemma2,Text Embedding,a40,m2,08:00:00,1,1,256002,4096,auto,singularity,default,true |
67 | | -e5-mistral-7b-instruct,e5,mistral-7b-instruct,Text Embedding,a40,m2,08:00:00,1,1,32000,4096,auto,singularity,default,true |
| 1 | +model_name,model_family,model_variant,model_type,num_gpus,num_nodes,vocab_size,max_model_len,max_num_seqs,pipeline_parallelism,qos,time,partition,data_type,venv,log_dir |
| 2 | +c4ai-command-r-plus,c4ai-command-r,plus,LLM,4,2,256000,8192,256,true,m2,08:00:00,a40,auto,singularity,default |
| 3 | +c4ai-command-r-plus-08-2024,c4ai-command-r,plus-08-2024,LLM,4,2,256000,65536,256,true,m2,08:00:00,a40,auto,singularity,default |
| 4 | +c4ai-command-r-08-2024,c4ai-command-r,08-2024,LLM,2,1,256000,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 5 | +CodeLlama-7b-hf,CodeLlama,7b-hf,LLM,1,1,32000,16384,256,true,m2,08:00:00,a40,auto,singularity,default |
| 6 | +CodeLlama-7b-Instruct-hf,CodeLlama,7b-Instruct-hf,LLM,1,1,32000,16384,256,true,m2,08:00:00,a40,auto,singularity,default |
| 7 | +CodeLlama-13b-hf,CodeLlama,13b-hf,LLM,1,1,32000,16384,256,true,m2,08:00:00,a40,auto,singularity,default |
| 8 | +CodeLlama-13b-Instruct-hf,CodeLlama,13b-Instruct-hf,LLM,1,1,32000,16384,256,true,m2,08:00:00,a40,auto,singularity,default |
| 9 | +CodeLlama-34b-hf,CodeLlama,34b-hf,LLM,2,1,32000,16384,256,true,m2,08:00:00,a40,auto,singularity,default |
| 10 | +CodeLlama-34b-Instruct-hf,CodeLlama,34b-Instruct-hf,LLM,2,1,32000,16384,256,true,m2,08:00:00,a40,auto,singularity,default |
| 11 | +CodeLlama-70b-hf,CodeLlama,70b-hf,LLM,4,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 12 | +CodeLlama-70b-Instruct-hf,CodeLlama,70b-Instruct-hf,LLM,4,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 13 | +dbrx-instruct,dbrx,instruct,LLM,4,2,100352,32000,256,true,m2,08:00:00,a40,auto,singularity,default |
| 14 | +gemma-2-9b,gemma-2,9b,LLM,1,1,256000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 15 | +gemma-2-9b-it,gemma-2,9b-it,LLM,1,1,256000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 16 | +gemma-2-27b,gemma-2,27b,LLM,2,1,256000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 17 | +gemma-2-27b-it,gemma-2,27b-it,LLM,2,1,256000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 18 | +Llama-2-7b-hf,Llama-2,7b-hf,LLM,1,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 19 | +Llama-2-7b-chat-hf,Llama-2,7b-chat-hf,LLM,1,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 20 | +Llama-2-13b-hf,Llama-2,13b-hf,LLM,1,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 21 | +Llama-2-13b-chat-hf,Llama-2,13b-chat-hf,LLM,1,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 22 | +Llama-2-70b-hf,Llama-2,70b-hf,LLM,4,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 23 | +Llama-2-70b-chat-hf,Llama-2,70b-chat-hf,LLM,4,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 24 | +llava-1.5-7b-hf,llava-1.5,7b-hf,VLM,1,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 25 | +llava-1.5-13b-hf,llava-1.5,13b-hf,VLM,1,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 26 | +llava-v1.6-mistral-7b-hf,llava-v1.6,mistral-7b-hf,VLM,1,1,32064,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 27 | +llava-v1.6-34b-hf,llava-v1.6,34b-hf,VLM,2,1,64064,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 28 | +Meta-Llama-3-8B,Meta-Llama-3,8B,LLM,1,1,128256,8192,256,true,m2,08:00:00,a40,auto,singularity,default |
| 29 | +Meta-Llama-3-8B-Instruct,Meta-Llama-3,8B-Instruct,LLM,1,1,128256,8192,256,true,m2,08:00:00,a40,auto,singularity,default |
| 30 | +Meta-Llama-3-70B,Meta-Llama-3,70B,LLM,4,1,128256,8192,256,true,m2,08:00:00,a40,auto,singularity,default |
| 31 | +Meta-Llama-3-70B-Instruct,Meta-Llama-3,70B-Instruct,LLM,4,1,128256,8192,256,true,m2,08:00:00,a40,auto,singularity,default |
| 32 | +Meta-Llama-3.1-8B,Meta-Llama-3.1,8B,LLM,1,1,128256,131072,256,true,m2,08:00:00,a40,auto,singularity,default |
| 33 | +Meta-Llama-3.1-8B-Instruct,Meta-Llama-3.1,8B-Instruct,LLM,1,1,128256,131072,256,true,m2,08:00:00,a40,auto,singularity,default |
| 34 | +Meta-Llama-3.1-70B,Meta-Llama-3.1,70B,LLM,4,1,128256,65536,256,true,m2,08:00:00,a40,auto,singularity,default |
| 35 | +Meta-Llama-3.1-70B-Instruct,Meta-Llama-3.1,70B-Instruct,LLM,4,1,128256,65536,256,true,m2,08:00:00,a40,auto,singularity,default |
| 36 | +Meta-Llama-3.1-405B-Instruct,Meta-Llama-3.1,405B-Instruct,LLM,4,8,128256,16384,256,true,m4,02:00:00,a40,auto,singularity,default |
| 37 | +Mistral-7B-v0.1,Mistral,7B-v0.1,LLM,1,1,32000,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 38 | +Mistral-7B-Instruct-v0.1,Mistral,7B-Instruct-v0.1,LLM,1,1,32000,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 39 | +Mistral-7B-Instruct-v0.2,Mistral,7B-Instruct-v0.2,LLM,1,1,32000,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 40 | +Mistral-7B-v0.3,Mistral,7B-v0.3,LLM,1,1,32768,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 41 | +Mistral-7B-Instruct-v0.3,Mistral,7B-Instruct-v0.3,LLM,1,1,32768,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 42 | +Mistral-Large-Instruct-2407,Mistral,Large-Instruct-2407,LLM,4,2,32768,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 43 | +Mixtral-8x7B-Instruct-v0.1,Mixtral,8x7B-Instruct-v0.1,LLM,4,1,32000,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 44 | +Mixtral-8x22B-v0.1,Mixtral,8x22B-v0.1,LLM,4,2,32768,65536,256,true,m2,08:00:00,a40,auto,singularity,default |
| 45 | +Mixtral-8x22B-Instruct-v0.1,Mixtral,8x22B-Instruct-v0.1,LLM,4,2,32768,65536,256,true,m2,08:00:00,a40,auto,singularity,default |
| 46 | +Phi-3-medium-128k-instruct,Phi-3,medium-128k-instruct,LLM,2,1,32064,131072,256,true,m2,08:00:00,a40,auto,singularity,default |
| 47 | +Phi-3-vision-128k-instruct,Phi-3,vision-128k-instruct,VLM,2,1,32064,65536,256,true,m2,08:00:00,a40,auto,singularity,default |
| 48 | +Llama3-OpenBioLLM-70B,Llama3-OpenBioLLM,70B,LLM,4,1,128256,8192,256,true,m2,08:00:00,a40,auto,singularity,default |
| 49 | +Llama-3.1-Nemotron-70B-Instruct-HF,Llama-3.1-Nemotron,70B-Instruct-HF,LLM,4,1,128256,65536,256,true,m2,08:00:00,a40,auto,singularity,default |
| 50 | +Llama-3.2-1B,Llama-3.2,1B,LLM,1,1,128256,131072,256,true,m2,08:00:00,a40,auto,singularity,default |
| 51 | +Llama-3.2-1B-Instruct,Llama-3.2,1B-Instruct,LLM,1,1,128256,131072,256,true,m2,08:00:00,a40,auto,singularity,default |
| 52 | +Llama-3.2-3B,Llama-3.2,3B,LLM,1,1,128256,131072,256,true,m2,08:00:00,a40,auto,singularity,default |
| 53 | +Llama-3.2-3B-Instruct,Llama-3.2,3B-Instruct,LLM,1,1,128256,131072,256,true,m2,08:00:00,a40,auto,singularity,default |
| 54 | +Llama-3.2-11B-Vision,Llama-3.2,11B-Vision,VLM,4,1,128256,4096,16,false,m2,08:00:00,a40,auto,singularity,default |
| 55 | +Llama-3.2-11B-Vision-Instruct,Llama-3.2,11B-Vision-Instruct,VLM,4,1,128256,4096,16,false,m2,08:00:00,a40,auto,singularity,default |
| 56 | +Llama-3.2-90B-Vision,Llama-3.2,90B-Vision,VLM,4,2,128256,4096,16,false,m2,08:00:00,a40,auto,singularity,default |
| 57 | +Llama-3.2-90B-Vision-Instruct,Llama-3.2,90B-Vision-Instruct,VLM,4,2,128256,4096,16,false,m2,08:00:00,a40,auto,singularity,default |
| 58 | +Qwen2.5-0.5B-Instruct,Qwen2.5,0.5B-Instruct,LLM,1,1,152064,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 59 | +Qwen2.5-1.5B-Instruct,Qwen2.5,1.5B-Instruct,LLM,1,1,152064,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 60 | +Qwen2.5-3B-Instruct,Qwen2.5,3B-Instruct,LLM,1,1,152064,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 61 | +Qwen2.5-7B-Instruct,Qwen2.5,7B-Instruct,LLM,1,1,152064,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 62 | +Qwen2.5-14B-Instruct,Qwen2.5,14B-Instruct,LLM,1,1,152064,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 63 | +Qwen2.5-32B-Instruct,Qwen2.5,32B-Instruct,LLM,2,1,152064,32768,256,true,m2,08:00:00,a40,auto,singularity,default |
| 64 | +Qwen2.5-72B-Instruct,Qwen2.5,72B-Instruct,LLM,4,1,152064,16384,256,true,m2,08:00:00,a40,auto,singularity,default |
| 65 | +Pixtral-12B-2409,Pixtral,12B-2409,VLM,1,1,131072,8192,256,true,m2,08:00:00,a40,auto,singularity,default |
| 66 | +bge-multilingual-gemma2,bge,multilingual-gemma2,Text Embedding,1,1,256002,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
| 67 | +e5-mistral-7b-instruct,e5,mistral-7b-instruct,Text Embedding,1,1,32000,4096,256,true,m2,08:00:00,a40,auto,singularity,default |
0 commit comments