@@ -1179,6 +1179,7 @@ class TensorNameMap:
11791179 MODEL_TENSOR .V_MMPROJ_FC : (
11801180 "model.connector.modality_projection.proj" , # SmolVLM
11811181 "model.vision.linear_proj.linear_proj" , # cogvlm
1182+ "model.projector.layers" , # Deepseek-OCR
11821183 ),
11831184
11841185 MODEL_TENSOR .V_MMPROJ_MLP : (
@@ -1197,6 +1198,7 @@ class TensorNameMap:
11971198 "model.vision_tower.embeddings.cls_token" , # Intern-S1
11981199 "vision_model.class_embedding" , # llama 4
11991200 "model.vision.patch_embedding.cls_embedding" , # cogvlm
1201+ "model.vision_model.embeddings.class_embedding" , # Deepseek-OCR
12001202 ),
12011203
12021204 MODEL_TENSOR .V_ENC_EMBD_PATCH : (
@@ -1210,6 +1212,7 @@ class TensorNameMap:
12101212 "visual.patch_embed.proj" , # qwen2vl
12111213 "vision_tower.patch_embed.proj" , # kimi-vl
12121214 "model.vision.patch_embedding.proj" , # cogvlm
1215+ "model.vision_model.embeddings.patch_embedding" , # Deepseek-OCR CLIP
12131216 ),
12141217
12151218 MODEL_TENSOR .V_ENC_EMBD_POS : (
@@ -1222,10 +1225,19 @@ class TensorNameMap:
12221225 "visual.pos_embed" , # qwen3vl
12231226 "model.vision.patch_embedding.position_embedding" , # cogvlm
12241227 ),
1228+
1229+ MODEL_TENSOR .V_ENC_EMBD_IMGNL : (
1230+ "model.image_newline" , # Deepseek-OCR
1231+ ),
1232+
1233+ MODEL_TENSOR .V_ENC_EMBD_VSEP : (
1234+ "model.view_seperator" , # Deepseek-OCR; NOTE(review): "seperator" [sic] presumably mirrors the checkpoint's own tensor name - verify before correcting the spelling
1235+ ),
12251236
12261237 MODEL_TENSOR .V_ENC_ATTN_QKV : (
12271238 "visual.blocks.{bid}.attn.qkv" , # qwen3vl
12281239 "model.vision.transformer.layers.{bid}.attention.query_key_value" , # cogvlm
1240+ "model.vision_model.transformer.layers.{bid}.self_attn.qkv_proj" , # Deepseek-OCR CLIP
12291241 ),
12301242
12311243 MODEL_TENSOR .V_ENC_ATTN_Q : (
@@ -1238,6 +1250,7 @@ class TensorNameMap:
12381250 "vision_encoder.transformer.layers.{bid}.attention.wq" , # pixtral
12391251 "visual.blocks.{bid}.attn.q" , # qwen2vl, generated
12401252 "vision_tower.encoder.blocks.{bid}.wq" , # kimi-vl, generated
1253+ "model.vision_model.transformer.layers.{bid}.self_attn.q_proj" , # Deepseek-OCR CLIP, generated
12411254 ),
12421255
12431256 MODEL_TENSOR .V_ENC_ATTN_Q_NORM : (
@@ -1255,6 +1268,7 @@ class TensorNameMap:
12551268 "vision_encoder.transformer.layers.{bid}.attention.wk" , # pixtral
12561269 "visual.blocks.{bid}.attn.k" , # qwen2vl, generated
12571270 "vision_tower.encoder.blocks.{bid}.wk" , # kimi-vl, generated
1271+ "model.vision_model.transformer.layers.{bid}.self_attn.k_proj" , # Deepseek-OCR CLIP, generated
12581272 ),
12591273
12601274 MODEL_TENSOR .V_ENC_ATTN_K_NORM : (
@@ -1272,6 +1286,7 @@ class TensorNameMap:
12721286 "vision_encoder.transformer.layers.{bid}.attention.wv" , # pixtral
12731287 "visual.blocks.{bid}.attn.v" , # qwen2vl, generated
12741288 "vision_tower.encoder.blocks.{bid}.wv" , # kimi-vl, generated
1289+ "model.vision_model.transformer.layers.{bid}.self_attn.v_proj" , # Deepseek-OCR CLIP, generated
12751290 ),
12761291
12771292 MODEL_TENSOR .V_ENC_INPUT_NORM : (
@@ -1286,6 +1301,7 @@ class TensorNameMap:
12861301 "visual.blocks.{bid}.norm1" , # qwen2vl
12871302 "vision_tower.encoder.blocks.{bid}.norm0" , # kimi-vl (norm0/norm1)
12881303 "model.vision.transformer.layers.{bid}.input_layernorm" , # cogvlm
1304+ "model.vision_model.transformer.layers.{bid}.layer_norm1" , # Deepseek-OCR CLIP
12891305 ),
12901306
12911307 MODEL_TENSOR .V_ENC_ATTN_O : (
@@ -1301,6 +1317,7 @@ class TensorNameMap:
13011317 "visual.blocks.{bid}.attn.proj" , # qwen2vl
13021318 "vision_tower.encoder.blocks.{bid}.wo" , # kimi-vl
13031319 "model.vision.transformer.layers.{bid}.attention.dense" , # cogvlm
1320+ "model.vision_model.transformer.layers.{bid}.self_attn.out_proj" , # Deepseek-OCR CLIP
13041321 ),
13051322
13061323 MODEL_TENSOR .V_ENC_POST_ATTN_NORM : (
@@ -1315,6 +1332,7 @@ class TensorNameMap:
13151332 "visual.blocks.{bid}.norm2" , # qwen2vl
13161333 "vision_tower.encoder.blocks.{bid}.norm1" , # kimi-vl (norm0/norm1)
13171334 "model.vision.transformer.layers.{bid}.post_attention_layernorm" , # cogvlm
1335+ "model.vision_model.transformer.layers.{bid}.layer_norm2" , # Deepseek-OCR CLIP
13181336 ),
13191337
13201338 MODEL_TENSOR .V_ENC_FFN_UP : (
@@ -1329,6 +1347,7 @@ class TensorNameMap:
13291347 "visual.blocks.{bid}.mlp.up_proj" , # qwen2.5vl
13301348 "visual.blocks.{bid}.mlp.linear_fc1" , # qwen3vl
13311349 "vision_tower.encoder.blocks.{bid}.mlp.fc0" , # kimi-vl (fc0/fc1)
1350+ "model.vision_model.transformer.layers.{bid}.mlp.fc1" , # Deepseek-OCR CLIP
13321351 "model.vision.transformer.layers.{bid}.mlp.fc1" , # cogvlm
13331352 ),
13341353
@@ -1351,6 +1370,7 @@ class TensorNameMap:
13511370 "visual.blocks.{bid}.mlp.linear_fc2" , # qwen3vl
13521371 "vision_tower.encoder.blocks.{bid}.mlp.fc1" , # kimi-vl (fc0/fc1)
13531372 "model.vision.transformer.layers.{bid}.mlp.fc2" , # cogvlm
1373+ "model.vision_model.transformer.layers.{bid}.mlp.fc2" , # Deepseek-OCR CLIP
13541374 ),
13551375
13561376 MODEL_TENSOR .V_LAYER_SCALE_1 : (
@@ -1368,6 +1388,7 @@ class TensorNameMap:
13681388 "vision_tower.ln_pre" , # pixtral-hf
13691389 "vision_encoder.ln_pre" , # pixtral
13701390 "vision_model.layernorm_pre" , # llama4
1391+ "model.vision_model.pre_layrnorm" , # Deepseek-OCR CLIP
13711392 ),
13721393
13731394 MODEL_TENSOR .V_POST_NORM : (
@@ -1460,11 +1481,11 @@ class TensorNameMap:
14601481 ),
14611482
14621483 MODEL_TENSOR .V_SAM_POS_EMBD : (
1463- "model.sam_model.pos_embed"
1484+ "model.sam_model.pos_embed" , # trailing comma is required: ("name") is a plain str, ("name",) is a 1-tuple
14641485 ),
14651486
14661487 MODEL_TENSOR .V_SAM_PATCH_EMBD : (
1467- "model.sam_model.patch_embed.proj"
1488+ "model.sam_model.patch_embed.proj" ,
14681489 ),
14691490
14701491 MODEL_TENSOR .V_SAM_PRE_NORM : (
@@ -1476,19 +1497,19 @@ class TensorNameMap:
14761497 ),
14771498
14781499 MODEL_TENSOR .V_SAM_ATTN_POS_H : (
1479- "model.sam_model.blocks.{bid}.attn.rel_pos_h"
1500+ "model.sam_model.blocks.{bid}.attn.rel_pos_h" , # trailing comma is required: ("name") is a plain str, ("name",) is a 1-tuple
14801501 ),
14811502
14821503 MODEL_TENSOR .V_SAM_ATTN_POS_W : (
1483- "model.sam_model.blocks.{bid}.attn.rel_pos_w"
1504+ "model.sam_model.blocks.{bid}.attn.rel_pos_w" ,
14841505 ),
14851506
14861507 MODEL_TENSOR .V_SAM_ATTN_QKV : (
1487- "model.sam_model.blocks.{bid}.attn.qkv"
1508+ "model.sam_model.blocks.{bid}.attn.qkv" ,
14881509 ),
14891510
14901511 MODEL_TENSOR .V_SAM_ATTN_OUT : (
1491- "model.sam_model.blocks.{bid}.attn.proj"
1512+ "model.sam_model.blocks.{bid}.attn.proj" ,
14921513 ),
14931514
14941515 MODEL_TENSOR .V_SAM_MLP_LIN_1 : (
@@ -1500,15 +1521,15 @@ class TensorNameMap:
15001521 ),
15011522
15021523 MODEL_TENSOR .V_SAM_NECK : (
1503- "model.sam_model.neck.{bid}"
1524+ "model.sam_model.neck.{bid}" , # trailing comma is required: ("name") is a plain str, ("name",) is a 1-tuple
15041525 ),
15051526
15061527 MODEL_TENSOR .V_SAM_NET_2 : (
1507- "model.sam_model.net_2"
1528+ "model.sam_model.net_2" ,
15081529 ),
15091530
15101531 MODEL_TENSOR .V_SAM_NET_3 : (
1511- "model.sam_model.net_3"
1532+ "model.sam_model.net_3" ,
15121533 ),
15131534
15141535 MODEL_TENSOR .V_MM_POST_FC_NORM : (
0 commit comments