@@ -424,6 +424,7 @@ class MODEL_ARCH(IntEnum):
424424 SEED_OSS = auto ()
425425 GROVEMOE = auto ()
426426 APERTUS = auto ()
427+ COGVLM = auto ()
427428
428429
429430class VISION_PROJECTOR_TYPE (IntEnum ):
@@ -435,6 +436,7 @@ class VISION_PROJECTOR_TYPE(IntEnum):
435436 MERGER = auto ()
436437 GEMMA3 = auto ()
437438 QWEN3VL = auto ()
439+ COGVLM = auto ()
438440
439441
440442class MODEL_TENSOR (IntEnum ):
@@ -605,6 +607,11 @@ class MODEL_TENSOR(IntEnum):
605607 SHORTCONV_CONV = auto ()
606608 SHORTCONV_INPROJ = auto ()
607609 SHORTCONV_OUTPROJ = auto ()
610+ VISEXP_ATTN_QKV = auto ()
611+ VISEXP_ATTN_OUT = auto ()
612+ VISEXP_GATE = auto ()
613+ VISEXP_DOWN = auto ()
614+ VISEXP_UP = auto ()
608615 # vision
609616 V_MMPROJ = auto ()
610617 V_MMPROJ_FC = auto ()
@@ -649,6 +656,12 @@ class MODEL_TENSOR(IntEnum):
649656 V_DS_NORM = auto () # qwen3vl
650657 V_DS_FC1 = auto () # qwen3vl
651658 V_DS_FC2 = auto () # qwen3vl
659+ V_MM_POST_FC_NORM = auto () # cogvlm
660+ V_MM_UP = auto () # cogvlm
661+ V_MM_DOWN = auto () # cogvlm
662+ V_MM_GATE = auto () # cogvlm
663+ V_TOK_BOI = auto () # cogvlm
664+ V_TOK_EOI = auto () # cogvlm
652665 # audio (mtmd)
653666 A_ENC_EMBD_POS = auto ()
654667 A_ENC_CONV1D = auto ()
@@ -777,6 +790,7 @@ class MODEL_TENSOR(IntEnum):
777790 MODEL_ARCH .SEED_OSS : "seed_oss" ,
778791 MODEL_ARCH .GROVEMOE : "grovemoe" ,
779792 MODEL_ARCH .APERTUS : "apertus" ,
793+ MODEL_ARCH .COGVLM : "cogvlm" ,
780794}
781795
782796VISION_PROJECTOR_TYPE_NAMES : dict [VISION_PROJECTOR_TYPE , str ] = {
@@ -957,6 +971,11 @@ class MODEL_TENSOR(IntEnum):
957971 MODEL_TENSOR .SHORTCONV_CONV : "blk.{bid}.shortconv.conv" ,
958972 MODEL_TENSOR .SHORTCONV_INPROJ : "blk.{bid}.shortconv.in_proj" ,
959973 MODEL_TENSOR .SHORTCONV_OUTPROJ : "blk.{bid}.shortconv.out_proj" ,
974+ MODEL_TENSOR .VISEXP_ATTN_QKV : "blk.{bid}.vis_attn_qkv" ,
975+ MODEL_TENSOR .VISEXP_ATTN_OUT : "blk.{bid}.vis_attn_output" ,
976+ MODEL_TENSOR .VISEXP_GATE : "blk.{bid}.vis_gate" ,
977+ MODEL_TENSOR .VISEXP_DOWN : "blk.{bid}.vis_down" ,
978+ MODEL_TENSOR .VISEXP_UP : "blk.{bid}.vis_up" ,
960979 # vision
961980 MODEL_TENSOR .V_MMPROJ : "mm.{bid}" ,
962981 MODEL_TENSOR .V_MMPROJ_FC : "mm.model.fc" ,
@@ -1001,6 +1020,12 @@ class MODEL_TENSOR(IntEnum):
10011020 MODEL_TENSOR .V_DS_NORM : "v.deepstack.{bid}.norm" ,
10021021 MODEL_TENSOR .V_DS_FC1 : "v.deepstack.{bid}.fc1" ,
10031022 MODEL_TENSOR .V_DS_FC2 : "v.deepstack.{bid}.fc2" ,
1023+ MODEL_TENSOR .V_MM_POST_FC_NORM : "mm.post_fc_norm" , # cogvlm
1024+ MODEL_TENSOR .V_MM_UP : "mm.up" ,
1025+ MODEL_TENSOR .V_MM_DOWN : "mm.down" ,
1026+ MODEL_TENSOR .V_MM_GATE : "mm.gate" ,
1027+ MODEL_TENSOR .V_TOK_BOI : "v.boi" ,
1028+ MODEL_TENSOR .V_TOK_EOI : "v.eoi" ,
10041029 # audio (mtmd)
10051030 MODEL_TENSOR .A_ENC_EMBD_POS : "a.position_embd" ,
10061031 MODEL_TENSOR .A_ENC_CONV1D : "a.conv1d.{bid}" ,
@@ -1073,6 +1098,12 @@ class MODEL_TENSOR(IntEnum):
10731098 MODEL_TENSOR .V_DS_NORM ,
10741099 MODEL_TENSOR .V_DS_FC1 ,
10751100 MODEL_TENSOR .V_DS_FC2 ,
1101+ MODEL_TENSOR .V_MM_POST_FC_NORM ,
1102+ MODEL_TENSOR .V_MM_UP ,
1103+ MODEL_TENSOR .V_MM_DOWN ,
1104+ MODEL_TENSOR .V_MM_GATE ,
1105+ MODEL_TENSOR .V_TOK_BOI ,
1106+ MODEL_TENSOR .V_TOK_EOI ,
10761107 # audio
10771108 MODEL_TENSOR .A_ENC_EMBD_POS ,
10781109 MODEL_TENSOR .A_ENC_CONV1D ,
@@ -2890,6 +2921,23 @@ class MODEL_TENSOR(IntEnum):
28902921 MODEL_TENSOR .FFN_DOWN_CHEXP ,
28912922 MODEL_TENSOR .FFN_UP_CHEXP ,
28922923 ],
2924+ MODEL_ARCH .COGVLM : [
2925+ MODEL_TENSOR .TOKEN_EMBD ,
2926+ MODEL_TENSOR .OUTPUT_NORM ,
2927+ MODEL_TENSOR .OUTPUT ,
2928+ MODEL_TENSOR .ATTN_NORM ,
2929+ MODEL_TENSOR .ATTN_QKV ,
2930+ MODEL_TENSOR .ATTN_OUT ,
2931+ MODEL_TENSOR .FFN_NORM ,
2932+ MODEL_TENSOR .FFN_GATE ,
2933+ MODEL_TENSOR .FFN_DOWN ,
2934+ MODEL_TENSOR .FFN_UP ,
2935+ MODEL_TENSOR .VISEXP_ATTN_QKV ,
2936+ MODEL_TENSOR .VISEXP_ATTN_OUT ,
2937+ MODEL_TENSOR .VISEXP_GATE ,
2938+ MODEL_TENSOR .VISEXP_UP ,
2939+ MODEL_TENSOR .VISEXP_DOWN ,
2940+ ],
28932941 # TODO
28942942}
28952943
@@ -3117,6 +3165,7 @@ class VisionProjectorType:
31173165 LFM2 = "lfm2"
31183166 KIMIVL = "kimivl"
31193167 LIGHTONOCR = "lightonocr"
3168+ COGVLM = "cogvlm"
31203169
31213170
31223171# Items here are (block size, type size)
0 commit comments