1 file changed: +26 -0 lines changed
Original file line number | Diff line number | Diff line change
@@ -301,6 +301,7 @@ class MODEL_ARCH(IntEnum):
301301 PHI3 = auto ()
302302 PHIMOE = auto ()
303303 PLAMO = auto ()
304+ PLAMO2 = auto ()
304305 CODESHELL = auto ()
305306 ORION = auto ()
306307 INTERNLM2 = auto ()
@@ -581,6 +582,7 @@ class MODEL_TENSOR(IntEnum):
581582 MODEL_ARCH .PHI3 : "phi3" ,
582583 MODEL_ARCH .PHIMOE : "phimoe" ,
583584 MODEL_ARCH .PLAMO : "plamo" ,
585+ MODEL_ARCH .PLAMO2 : "plamo2" ,
584586 MODEL_ARCH .CODESHELL : "codeshell" ,
585587 MODEL_ARCH .ORION : "orion" ,
586588 MODEL_ARCH .INTERNLM2 : "internlm2" ,
@@ -1272,6 +1274,30 @@ class MODEL_TENSOR(IntEnum):
12721274 MODEL_TENSOR .FFN_DOWN ,
12731275 MODEL_TENSOR .FFN_UP ,
12741276 ],
1277+ MODEL_ARCH .PLAMO2 : [
1278+ MODEL_TENSOR .TOKEN_EMBD ,
1279+ MODEL_TENSOR .OUTPUT_NORM ,
1280+ MODEL_TENSOR .OUTPUT ,
1281+ MODEL_TENSOR .ROPE_FREQS ,
1282+ MODEL_TENSOR .ATTN_NORM ,
1283+ MODEL_TENSOR .ATTN_Q ,
1284+ MODEL_TENSOR .ATTN_K ,
1285+ MODEL_TENSOR .ATTN_V ,
1286+ MODEL_TENSOR .ATTN_OUT ,
1287+ MODEL_TENSOR .ATTN_ROT_EMBD ,
1288+ MODEL_TENSOR .FFN_NORM ,
1289+ MODEL_TENSOR .FFN_GATE ,
1290+ MODEL_TENSOR .FFN_DOWN ,
1291+ MODEL_TENSOR .FFN_UP ,
1292+ # SSM/Mamba tensors for hybrid architecture
1293+ MODEL_TENSOR .SSM_IN ,
1294+ MODEL_TENSOR .SSM_CONV1D ,
1295+ MODEL_TENSOR .SSM_X ,
1296+ MODEL_TENSOR .SSM_DT ,
1297+ MODEL_TENSOR .SSM_A ,
1298+ MODEL_TENSOR .SSM_D ,
1299+ MODEL_TENSOR .SSM_OUT ,
1300+ ],
12751301 MODEL_ARCH .GPT2 : [
12761302 MODEL_TENSOR .TOKEN_EMBD ,
12771303 MODEL_TENSOR .POS_EMBD ,
You can’t perform that action at this time.
0 commit comments