File tree Expand file tree Collapse file tree 2 files changed +5
-5
lines changed Expand file tree Collapse file tree 2 files changed +5
-5
lines changed Original file line number Diff line number Diff line change @@ -247,8 +247,8 @@ class MODEL_ARCH(IntEnum):
247247    OLMOE         =  auto ()
248248    OPENELM       =  auto ()
249249    ARCTIC        =  auto ()
250-     DEEPSEEK2     =  auto ()
251250    DEEPSEEK      =  auto ()
251+     DEEPSEEK2     =  auto ()
252252    CHATGLM       =  auto ()
253253    BITNET        =  auto ()
254254    T5            =  auto ()
@@ -410,8 +410,8 @@ class MODEL_TENSOR(IntEnum):
410410    MODEL_ARCH .OLMOE :          "olmoe" ,
411411    MODEL_ARCH .OPENELM :        "openelm" ,
412412    MODEL_ARCH .ARCTIC :         "arctic" ,
413-     MODEL_ARCH .DEEPSEEK2 :      "deepseek2" ,
414413    MODEL_ARCH .DEEPSEEK :       "deepseek" ,
414+     MODEL_ARCH .DEEPSEEK2 :      "deepseek2" ,
415415    MODEL_ARCH .CHATGLM :        "chatglm" ,
416416    MODEL_ARCH .BITNET :         "bitnet" ,
417417    MODEL_ARCH .T5 :             "t5" ,
Original file line number Diff line number Diff line change @@ -306,7 +306,7 @@ class TensorNameMap:
306306
307307        MODEL_TENSOR .FFN_UP_SHEXP : (
308308            "model.layers.{bid}.mlp.shared_expert.up_proj" ,  # qwen2moe 
309-             "model.layers.{bid}.mlp.shared_experts.up_proj" , # deepseek2 
309+             "model.layers.{bid}.mlp.shared_experts.up_proj" , # deepseek  deepseek2 
310310        ),
311311
312312        # AWQ-activation gate 
@@ -338,7 +338,7 @@ class TensorNameMap:
338338
339339        MODEL_TENSOR .FFN_GATE_SHEXP : (
340340            "model.layers.{bid}.mlp.shared_expert.gate_proj" ,  # qwen2moe 
341-             "model.layers.{bid}.mlp.shared_experts.gate_proj" , # deepseek2 
341+             "model.layers.{bid}.mlp.shared_experts.gate_proj" , # deepseek  deepseek2 
342342        ),
343343
344344        # Feed-forward down 
@@ -379,7 +379,7 @@ class TensorNameMap:
379379
380380        MODEL_TENSOR .FFN_DOWN_SHEXP : (
381381            "model.layers.{bid}.mlp.shared_expert.down_proj" ,  # qwen2moe 
382-             "model.layers.{bid}.mlp.shared_experts.down_proj" , # deepseek2 
382+             "model.layers.{bid}.mlp.shared_experts.down_proj" , # deepseek  deepseek2 
383383        ),
384384
385385        MODEL_TENSOR .ATTN_Q_NORM : (
 
 
   
 
     
   
   
          
    
    
     
    
      
     
     
    You can’t perform that action at this time.
  
 
    
  
    
      
        
     
       
      
     
   
 
    
    
  
 
  
 
     
    
0 commit comments