Skip to content

Commit 1ffa83f

Browse files
committed
basic kimi-vl textmodel conversion
1 parent: 5c0eb5e · commit: 1ffa83f

1 file changed

Lines changed: 8 additions & 0 deletions

File tree

convert_hf_to_gguf.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -6059,6 +6059,7 @@ def prepare_tensors(self):
60596059

60606060
@ModelBase.register("DeepseekV2ForCausalLM")
60616061
@ModelBase.register("DeepseekV3ForCausalLM")
6062+
@ModelBase.register("KimiVLForConditionalGeneration")
60626063
class DeepseekV2Model(TextModel):
60636064
model_arch = gguf.MODEL_ARCH.DEEPSEEK2
60646065

@@ -6161,6 +6162,13 @@ def set_gguf_parameters(self):
61616162
_experts: list[dict[str, Tensor]] | None = None
61626163

61636164
def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iterable[tuple[str, Tensor]]:
6165+
# skip vision tensors (vision tower and multi-modal projector) and strip the "language_model." prefix for Kimi-VL
6166+
if "vision_tower" in name or "multi_modal_projector" in name:
6167+
return []
6168+
6169+
if name.startswith("language_model."):
6170+
name = name.replace("language_model.", "")
6171+
61646172
# rename e_score_correction_bias tensors
61656173
if name.endswith("e_score_correction_bias"):
61666174
name = name.replace("e_score_correction_bias", "e_score_correction.bias")

0 commit comments

Comments
 (0)