@@ -1368,6 +1368,7 @@ class MODEL_TENSOR(IntEnum):
13681368 MODEL_TENSOR .FFN_GATE_EXP ,
13691369 MODEL_TENSOR .FFN_DOWN_EXP ,
13701370 MODEL_TENSOR .FFN_UP_EXP ,
1371+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
13711372 ],
13721373 MODEL_ARCH .LLAMA4 : [
13731374 MODEL_TENSOR .TOKEN_EMBD ,
@@ -1388,6 +1389,7 @@ class MODEL_TENSOR(IntEnum):
13881389 MODEL_TENSOR .FFN_GATE_EXP ,
13891390 MODEL_TENSOR .FFN_DOWN_EXP ,
13901391 MODEL_TENSOR .FFN_UP_EXP ,
1392+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
13911393 MODEL_TENSOR .FFN_GATE_SHEXP ,
13921394 MODEL_TENSOR .FFN_DOWN_SHEXP ,
13931395 MODEL_TENSOR .FFN_UP_SHEXP ,
@@ -1411,6 +1413,7 @@ class MODEL_TENSOR(IntEnum):
14111413 MODEL_TENSOR .FFN_GATE_EXP ,
14121414 MODEL_TENSOR .FFN_DOWN_EXP ,
14131415 MODEL_TENSOR .FFN_UP_EXP ,
1416+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
14141417 ],
14151418 MODEL_ARCH .GROK : [
14161419 MODEL_TENSOR .TOKEN_EMBD ,
@@ -1432,6 +1435,7 @@ class MODEL_TENSOR(IntEnum):
14321435 MODEL_TENSOR .FFN_GATE_EXP ,
14331436 MODEL_TENSOR .FFN_DOWN_EXP ,
14341437 MODEL_TENSOR .FFN_UP_EXP ,
1438+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
14351439 MODEL_TENSOR .FFN_POST_NORM ,
14361440 MODEL_TENSOR .LAYER_OUT_NORM ,
14371441 ],
@@ -1746,6 +1750,7 @@ class MODEL_TENSOR(IntEnum):
17461750 MODEL_TENSOR .FFN_GATE_EXP ,
17471751 MODEL_TENSOR .FFN_DOWN_EXP ,
17481752 MODEL_TENSOR .FFN_UP_EXP ,
1753+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
17491754 MODEL_TENSOR .FFN_GATE_INP_SHEXP ,
17501755 MODEL_TENSOR .FFN_GATE_SHEXP ,
17511756 MODEL_TENSOR .FFN_DOWN_SHEXP ,
@@ -1784,6 +1789,7 @@ class MODEL_TENSOR(IntEnum):
17841789 MODEL_TENSOR .FFN_GATE_EXP ,
17851790 MODEL_TENSOR .FFN_DOWN_EXP ,
17861791 MODEL_TENSOR .FFN_UP_EXP ,
1792+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
17871793 ],
17881794 MODEL_ARCH .QWEN3NEXT : [
17891795 MODEL_TENSOR .TOKEN_EMBD ,
@@ -1807,6 +1813,7 @@ class MODEL_TENSOR(IntEnum):
18071813 MODEL_TENSOR .FFN_DOWN_EXP ,
18081814 MODEL_TENSOR .FFN_UP_EXP ,
18091815 MODEL_TENSOR .FFN_GATE_EXP ,
1816+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
18101817 MODEL_TENSOR .SSM_A ,
18111818 MODEL_TENSOR .SSM_CONV1D ,
18121819 MODEL_TENSOR .SSM_DT ,
@@ -1848,6 +1855,7 @@ class MODEL_TENSOR(IntEnum):
18481855 MODEL_TENSOR .FFN_GATE_EXP ,
18491856 MODEL_TENSOR .FFN_DOWN_EXP ,
18501857 MODEL_TENSOR .FFN_UP_EXP ,
1858+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
18511859 ],
18521860 MODEL_ARCH .QWEN35 : [
18531861 MODEL_TENSOR .TOKEN_EMBD ,
@@ -2023,6 +2031,7 @@ class MODEL_TENSOR(IntEnum):
20232031 MODEL_TENSOR .FFN_GATE_EXP ,
20242032 MODEL_TENSOR .FFN_DOWN_EXP ,
20252033 MODEL_TENSOR .FFN_UP_EXP ,
2034+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
20262035 ],
20272036 MODEL_ARCH .CODESHELL : [
20282037 MODEL_TENSOR .TOKEN_EMBD ,
@@ -2089,6 +2098,7 @@ class MODEL_TENSOR(IntEnum):
20892098 MODEL_TENSOR .FFN_GATE_EXP ,
20902099 MODEL_TENSOR .FFN_DOWN_EXP ,
20912100 MODEL_TENSOR .FFN_UP_EXP ,
2101+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
20922102 ],
20932103 MODEL_ARCH .MINICPM3 : [
20942104 MODEL_TENSOR .TOKEN_EMBD ,
@@ -2401,6 +2411,7 @@ class MODEL_TENSOR(IntEnum):
24012411 MODEL_TENSOR .FFN_GATE_EXP ,
24022412 MODEL_TENSOR .FFN_DOWN_EXP ,
24032413 MODEL_TENSOR .FFN_UP_EXP ,
2414+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
24042415 ],
24052416 MODEL_ARCH .XVERSE : [
24062417 MODEL_TENSOR .TOKEN_EMBD ,
@@ -2456,6 +2467,7 @@ class MODEL_TENSOR(IntEnum):
24562467 MODEL_TENSOR .FFN_GATE_EXP ,
24572468 MODEL_TENSOR .FFN_DOWN_EXP ,
24582469 MODEL_TENSOR .FFN_UP_EXP ,
2470+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
24592471 ],
24602472 MODEL_ARCH .OLMO : [
24612473 MODEL_TENSOR .TOKEN_EMBD ,
@@ -2514,6 +2526,7 @@ class MODEL_TENSOR(IntEnum):
25142526 MODEL_TENSOR .FFN_GATE_EXP ,
25152527 MODEL_TENSOR .FFN_UP_EXP ,
25162528 MODEL_TENSOR .FFN_DOWN_EXP ,
2529+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
25172530 ],
25182531 MODEL_ARCH .OPENELM : [
25192532 MODEL_TENSOR .TOKEN_EMBD ,
@@ -2548,6 +2561,7 @@ class MODEL_TENSOR(IntEnum):
25482561 MODEL_TENSOR .FFN_GATE_EXP ,
25492562 MODEL_TENSOR .FFN_DOWN_EXP ,
25502563 MODEL_TENSOR .FFN_UP_EXP ,
2564+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
25512565 ],
25522566 MODEL_ARCH .DEEPSEEK : [
25532567 MODEL_TENSOR .TOKEN_EMBD ,
@@ -2568,6 +2582,7 @@ class MODEL_TENSOR(IntEnum):
25682582 MODEL_TENSOR .FFN_GATE_EXP ,
25692583 MODEL_TENSOR .FFN_DOWN_EXP ,
25702584 MODEL_TENSOR .FFN_UP_EXP ,
2585+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
25712586 MODEL_TENSOR .FFN_GATE_SHEXP ,
25722587 MODEL_TENSOR .FFN_DOWN_SHEXP ,
25732588 MODEL_TENSOR .FFN_UP_SHEXP ,
@@ -2620,6 +2635,7 @@ class MODEL_TENSOR(IntEnum):
26202635 MODEL_TENSOR .FFN_GATE_EXP ,
26212636 MODEL_TENSOR .FFN_DOWN_EXP ,
26222637 MODEL_TENSOR .FFN_UP_EXP ,
2638+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
26232639 MODEL_TENSOR .FFN_GATE_SHEXP ,
26242640 MODEL_TENSOR .FFN_DOWN_SHEXP ,
26252641 MODEL_TENSOR .FFN_UP_SHEXP ,
@@ -2697,6 +2713,7 @@ class MODEL_TENSOR(IntEnum):
26972713 MODEL_TENSOR .FFN_GATE_EXP ,
26982714 MODEL_TENSOR .FFN_DOWN_EXP ,
26992715 MODEL_TENSOR .FFN_UP_EXP ,
2716+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
27002717 MODEL_TENSOR .FFN_GATE_SHEXP ,
27012718 MODEL_TENSOR .FFN_DOWN_SHEXP ,
27022719 MODEL_TENSOR .FFN_UP_SHEXP ,
@@ -2951,6 +2968,7 @@ class MODEL_TENSOR(IntEnum):
29512968 MODEL_TENSOR .FFN_GATE_EXP ,
29522969 MODEL_TENSOR .FFN_DOWN_EXP ,
29532970 MODEL_TENSOR .FFN_UP_EXP ,
2971+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
29542972 MODEL_TENSOR .FFN_GATE_SHEXP ,
29552973 MODEL_TENSOR .FFN_DOWN_SHEXP ,
29562974 MODEL_TENSOR .FFN_UP_SHEXP ,
@@ -2991,6 +3009,7 @@ class MODEL_TENSOR(IntEnum):
29913009 MODEL_TENSOR .FFN_GATE_EXP ,
29923010 MODEL_TENSOR .FFN_DOWN_EXP ,
29933011 MODEL_TENSOR .FFN_UP_EXP ,
3012+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
29943013 MODEL_TENSOR .FFN_GATE_SHEXP ,
29953014 MODEL_TENSOR .FFN_UP_SHEXP ,
29963015 MODEL_TENSOR .FFN_DOWN_SHEXP ,
@@ -3017,6 +3036,7 @@ class MODEL_TENSOR(IntEnum):
30173036 MODEL_TENSOR .FFN_GATE_EXP ,
30183037 MODEL_TENSOR .FFN_DOWN_EXP ,
30193038 MODEL_TENSOR .FFN_UP_EXP ,
3039+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
30203040 MODEL_TENSOR .FFN_GATE_SHEXP ,
30213041 MODEL_TENSOR .FFN_UP_SHEXP ,
30223042 MODEL_TENSOR .FFN_DOWN_SHEXP ,
@@ -3078,6 +3098,7 @@ class MODEL_TENSOR(IntEnum):
30783098 MODEL_TENSOR .FFN_GATE_EXP ,
30793099 MODEL_TENSOR .FFN_DOWN_EXP ,
30803100 MODEL_TENSOR .FFN_UP_EXP ,
3101+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
30813102 MODEL_TENSOR .FFN_GATE_SHEXP ,
30823103 MODEL_TENSOR .FFN_DOWN_SHEXP ,
30833104 MODEL_TENSOR .FFN_UP_SHEXP ,
@@ -3100,6 +3121,7 @@ class MODEL_TENSOR(IntEnum):
31003121 MODEL_TENSOR .FFN_GATE_EXP ,
31013122 MODEL_TENSOR .FFN_DOWN_EXP ,
31023123 MODEL_TENSOR .FFN_UP_EXP ,
3124+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
31033125 MODEL_TENSOR .FFN_GATE_SHEXP ,
31043126 MODEL_TENSOR .FFN_DOWN_SHEXP ,
31053127 MODEL_TENSOR .FFN_UP_SHEXP ,
@@ -3134,6 +3156,7 @@ class MODEL_TENSOR(IntEnum):
31343156 MODEL_TENSOR .FFN_UP ,
31353157 MODEL_TENSOR .FFN_UP_EXP ,
31363158 MODEL_TENSOR .FFN_UP_SHEXP ,
3159+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
31373160 ],
31383161 MODEL_ARCH .ARCEE : [
31393162 MODEL_TENSOR .TOKEN_EMBD ,
@@ -3170,6 +3193,7 @@ class MODEL_TENSOR(IntEnum):
31703193 MODEL_TENSOR .FFN_GATE_EXP ,
31713194 MODEL_TENSOR .FFN_DOWN_EXP ,
31723195 MODEL_TENSOR .FFN_UP_EXP ,
3196+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
31733197 MODEL_TENSOR .FFN_GATE_SHEXP ,
31743198 MODEL_TENSOR .FFN_UP_SHEXP ,
31753199 MODEL_TENSOR .FFN_DOWN_SHEXP ,
@@ -3256,6 +3280,7 @@ class MODEL_TENSOR(IntEnum):
32563280 MODEL_TENSOR .FFN_GATE_EXP ,
32573281 MODEL_TENSOR .FFN_DOWN_EXP ,
32583282 MODEL_TENSOR .FFN_UP_EXP ,
3283+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
32593284 MODEL_TENSOR .FFN_GATE_SHEXP ,
32603285 MODEL_TENSOR .FFN_DOWN_SHEXP ,
32613286 MODEL_TENSOR .FFN_UP_SHEXP ,
@@ -3350,6 +3375,7 @@ class MODEL_TENSOR(IntEnum):
33503375 MODEL_TENSOR .FFN_GATE_EXP ,
33513376 MODEL_TENSOR .FFN_DOWN_EXP ,
33523377 MODEL_TENSOR .FFN_UP_EXP ,
3378+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
33533379 MODEL_TENSOR .FFN_EXP_PROBS_B ,
33543380 ],
33553381 MODEL_ARCH .SMALLTHINKER : [
@@ -3369,6 +3395,7 @@ class MODEL_TENSOR(IntEnum):
33693395 MODEL_TENSOR .FFN_GATE_EXP ,
33703396 MODEL_TENSOR .FFN_DOWN_EXP ,
33713397 MODEL_TENSOR .FFN_UP_EXP ,
3398+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
33723399 ],
33733400 MODEL_ARCH .APERTUS : [
33743401 MODEL_TENSOR .TOKEN_EMBD ,
@@ -3404,6 +3431,7 @@ class MODEL_TENSOR(IntEnum):
34043431 MODEL_TENSOR .FFN_GATE_EXP ,
34053432 MODEL_TENSOR .FFN_UP_EXP ,
34063433 MODEL_TENSOR .FFN_DOWN_EXP ,
3434+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
34073435 ],
34083436 MODEL_ARCH .GROVEMOE : [
34093437 MODEL_TENSOR .TOKEN_EMBD ,
@@ -3421,6 +3449,7 @@ class MODEL_TENSOR(IntEnum):
34213449 MODEL_TENSOR .FFN_GATE_EXP ,
34223450 MODEL_TENSOR .FFN_DOWN_EXP ,
34233451 MODEL_TENSOR .FFN_UP_EXP ,
3452+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
34243453 MODEL_TENSOR .FFN_GATE_CHEXP ,
34253454 MODEL_TENSOR .FFN_DOWN_CHEXP ,
34263455 MODEL_TENSOR .FFN_UP_CHEXP ,
@@ -3441,6 +3470,7 @@ class MODEL_TENSOR(IntEnum):
34413470 MODEL_TENSOR .FFN_GATE_EXP ,
34423471 MODEL_TENSOR .FFN_DOWN_EXP ,
34433472 MODEL_TENSOR .FFN_UP_EXP ,
3473+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
34443474 MODEL_TENSOR .FFN_EXP_PROBS_B ,
34453475 ],
34463476 MODEL_ARCH .COGVLM : [
@@ -3476,6 +3506,7 @@ class MODEL_TENSOR(IntEnum):
34763506 MODEL_TENSOR .FFN_GATE_EXP ,
34773507 MODEL_TENSOR .FFN_DOWN_EXP ,
34783508 MODEL_TENSOR .FFN_UP_EXP ,
3509+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
34793510 ],
34803511 MODEL_ARCH .PANGU_EMBED : [
34813512 MODEL_TENSOR .TOKEN_EMBD ,
@@ -3510,6 +3541,7 @@ class MODEL_TENSOR(IntEnum):
35103541 MODEL_TENSOR .FFN_GATE_EXP ,
35113542 MODEL_TENSOR .FFN_DOWN_EXP ,
35123543 MODEL_TENSOR .FFN_UP_EXP ,
3544+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
35133545 ],
35143546 MODEL_ARCH .MIMO2 : [
35153547 MODEL_TENSOR .TOKEN_EMBD ,
@@ -3529,6 +3561,7 @@ class MODEL_TENSOR(IntEnum):
35293561 MODEL_TENSOR .FFN_GATE_EXP ,
35303562 MODEL_TENSOR .FFN_DOWN_EXP ,
35313563 MODEL_TENSOR .FFN_UP_EXP ,
3564+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
35323565 MODEL_TENSOR .FFN_EXP_PROBS_B ,
35333566 ],
35343567 MODEL_ARCH .STEP35 : [
@@ -3576,6 +3609,7 @@ class MODEL_TENSOR(IntEnum):
35763609 MODEL_TENSOR .FFN_GATE_EXP ,
35773610 MODEL_TENSOR .FFN_DOWN_EXP ,
35783611 MODEL_TENSOR .FFN_UP_EXP ,
3612+ MODEL_TENSOR .FFN_GATE_UP_EXP ,
35793613 ],
35803614 MODEL_ARCH .MAINCODER : [
35813615 MODEL_TENSOR .TOKEN_EMBD ,
0 commit comments