Skip to content

Commit 5d9c603

Browse files
committed
Updated max model length for text embedding models; updated error handling for when errors that don't affect server launching show up in the error logs
1 parent 5d580a0 commit 5d9c603

File tree

2 files changed

+6
-5
lines changed

2 files changed

+6
-5
lines changed

vec_inf/cli/_utils.py

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -58,12 +58,13 @@ def is_server_running(
5858
if isinstance(log_content, str):
5959
return log_content
6060

61+
status = None
6162
for line in log_content:
6263
if "error" in line.lower():
63-
return ("FAILED", line.strip("\n"))
64+
status = ("FAILED", line.strip("\n"))
6465
if MODEL_READY_SIGNATURE in line:
65-
return "RUNNING"
66-
return "LAUNCHING"
66+
status = "RUNNING"
67+
return "LAUNCHING" if not status else status
6768

6869

6970
def get_base_url(slurm_job_name: str, slurm_job_id: int, log_dir: Optional[str]) -> str:

vec_inf/models/models.csv

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -63,5 +63,5 @@ Qwen2.5-14B-Instruct,Qwen2.5,14B-Instruct,LLM,a40,m2,08:00:00,1,1,152064,32768,a
6363
Qwen2.5-32B-Instruct,Qwen2.5,32B-Instruct,LLM,a40,m2,08:00:00,2,1,152064,32768,auto,singularity,default,true
6464
Qwen2.5-72B-Instruct,Qwen2.5,72B-Instruct,LLM,a40,m2,08:00:00,4,1,152064,32768,auto,singularity,default,true
6565
Pixtral-12B-2409,Pixtral,12B-2409,VLM,a40,m2,08:00:00,1,1,131072,16384,auto,singularity,default,true
66-
bge-multilingual-gemma2,bge,multilingual-gemma2,Text Embedding,a40,m2,08:00:00,1,1,256002,8192,auto,singularity,default,true
67-
e5-mistral-7b-instruct,e5,mistral-7b-instruct,Text Embedding,a40,m2,08:00:00,1,1,32000,32768,auto,singularity,default,true
66+
bge-multilingual-gemma2,bge,multilingual-gemma2,Text Embedding,a40,m2,08:00:00,1,1,256002,4096,auto,singularity,default,true
67+
e5-mistral-7b-instruct,e5,mistral-7b-instruct,Text Embedding,a40,m2,08:00:00,1,1,32000,4096,auto,singularity,default,true

0 commit comments

Comments
 (0)