@@ -343,6 +343,7 @@ class MODEL_ARCH(IntEnum):
343343 WAVTOKENIZER_DEC = auto ()
344344 PLM = auto ()
345345 BAILINGMOE = auto ()
346+ DOTS1 = auto ()
346347
347348
348349class VISION_PROJECTOR_TYPE (IntEnum ):
@@ -623,6 +624,7 @@ class MODEL_TENSOR(IntEnum):
623624 MODEL_ARCH .WAVTOKENIZER_DEC : "wavtokenizer-dec" ,
624625 MODEL_ARCH .PLM : "plm" ,
625626 MODEL_ARCH .BAILINGMOE : "bailingmoe" ,
627+ MODEL_ARCH .DOTS1 : "dots1" ,
626628}
627629
628630VISION_PROJECTOR_TYPE_NAMES : dict [VISION_PROJECTOR_TYPE , str ] = {
@@ -2044,6 +2046,30 @@ class MODEL_TENSOR(IntEnum):
20442046 MODEL_TENSOR .FFN_DOWN_SHEXP ,
20452047 MODEL_TENSOR .FFN_UP_SHEXP ,
20462048 ],
2049+ MODEL_ARCH .DOTS1 : [
2050+ MODEL_TENSOR .TOKEN_EMBD ,
2051+ MODEL_TENSOR .OUTPUT_NORM ,
2052+ MODEL_TENSOR .OUTPUT ,
2053+ MODEL_TENSOR .ATTN_NORM ,
2054+ MODEL_TENSOR .ATTN_Q ,
2055+ MODEL_TENSOR .ATTN_Q_NORM ,
2056+ MODEL_TENSOR .ATTN_K ,
2057+ MODEL_TENSOR .ATTN_K_NORM ,
2058+ MODEL_TENSOR .ATTN_V ,
2059+ MODEL_TENSOR .ATTN_OUT ,
2060+ MODEL_TENSOR .FFN_EXP_PROBS_B ,
2061+ MODEL_TENSOR .FFN_NORM ,
2062+ MODEL_TENSOR .FFN_GATE ,
2063+ MODEL_TENSOR .FFN_GATE_EXP ,
2064+ MODEL_TENSOR .FFN_GATE_INP ,
2065+ MODEL_TENSOR .FFN_GATE_SHEXP ,
2066+ MODEL_TENSOR .FFN_DOWN ,
2067+ MODEL_TENSOR .FFN_DOWN_EXP ,
2068+ MODEL_TENSOR .FFN_DOWN_SHEXP ,
2069+ MODEL_TENSOR .FFN_UP ,
2070+ MODEL_TENSOR .FFN_UP_EXP ,
2071+ MODEL_TENSOR .FFN_UP_SHEXP ,
2072+ ],
20472073 # TODO
20482074}
20492075
0 commit comments