@@ -6005,6 +6005,7 @@ def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iter
60056005
60066006 return [] # skip other tensors
60076007
6008+
60086009@ModelBase .register ("DeepseekOCRForCausalLM" )
60096010class DeepseekOCRVisionModel (MmprojModel ):
60106011 def set_gguf_parameters (self ):
@@ -6044,7 +6045,6 @@ def get_vision_config(self) -> dict[str, Any]:
60446045
60456046 return vision_config
60466047
6047-
60486048 def tensor_force_quant (self , name , new_name , bid , n_dims ):
60496049 # TODO: increase numerical stability. maybe delete later.
60506050 return gguf .GGMLQuantizationType .F32
@@ -7244,7 +7244,7 @@ class DeepseekV2Model(TextModel):
72447244 def __init__ (self , * args , ** kwargs ):
72457245 super ().__init__ (* args , ** kwargs )
72467246 vision_config = self .hparams .get ('vision_config' , {}).get ('width' , {})
7247-
7247+
72487248 if 'clip-l-14-224' in vision_config and 'sam_vit_b' in vision_config :
72497249 self .model_arch = gguf .MODEL_ARCH .DEEPSEEK2OCR
72507250 self .gguf_writer .arch = gguf .MODEL_ARCH_NAMES [self .model_arch ]
@@ -7354,8 +7354,12 @@ def set_gguf_parameters(self):
73547354
73557355 def modify_tensors (self , data_torch : Tensor , name : str , bid : int | None ) -> Iterable [tuple [str , Tensor ]]:
73567356 # skip vision tensors and remove "language_model." for Kimi-VL
7357- if "vision_" in name or "multi_modal_projector" in name \
7358- or "image_newline" in name or "model.projector" in name or "sam_model" in name or "view_seperator" in name :
7357+ if ("vision_" in name
7358+ or "multi_modal_projector" in name
7359+ or "image_newline" in name
7360+ or "model.projector" in name
7361+ or "sam_model" in name
7362+ or "view_seperator" in name ):
73597363 return []
73607364
73617365 if name .startswith ("language_model." ):
@@ -7435,6 +7439,7 @@ def prepare_tensors(self):
74357439 if len (experts ) > 0 :
74367440 raise ValueError (f"Unprocessed experts: { experts } " )
74377441
7442+
74387443@ModelBase .register ("MiniMaxM2ForCausalLM" )
74397444class MiniMaxM2Model (TextModel ):
74407445 model_arch = gguf .MODEL_ARCH .MINIMAXM2
0 commit comments