Skip to content

Commit d9efc04

Browse files
committed
tuning config on h200
1 parent 0c9a293 commit d9efc04

File tree

3 files changed

+70
-1
lines changed

3 files changed

+70
-1
lines changed

lightllm/common/fused_moe/grouped_fused_moe.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -273,7 +273,7 @@ def _get_moe_align_fused_configs():
273 273
}
274 274
for ns in [2, 3, 4, 5]
275 275
for nw in [4, 8]
276-
for bt in [1024, 2048]
276+
for bt in [128, 256, 512, 1024, 2048]
277 277
]
278 278

279 279

Original file line number | Diff line number | Diff line change
@@ -0,0 +1,7 @@
1+
{
2+
"8448": {
3+
"BLOCK_TOK": 128,
4+
"num_stages": 5,
5+
"num_warps": 4
6+
}
7+
}
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,62 @@
1+
{
2+
"1": {
3+
"BLOCK_TOK": 256,
4+
"num_stages": 2,
5+
"num_warps": 8
6+
},
7+
"100": {
8+
"BLOCK_TOK": 128,
9+
"num_stages": 2,
10+
"num_warps": 4
11+
},
12+
"1024": {
13+
"BLOCK_TOK": 256,
14+
"num_stages": 3,
15+
"num_warps": 8
16+
},
17+
"128": {
18+
"BLOCK_TOK": 128,
19+
"num_stages": 5,
20+
"num_warps": 4
21+
},
22+
"16": {
23+
"BLOCK_TOK": 256,
24+
"num_stages": 5,
25+
"num_warps": 8
26+
},
27+
"2048": {
28+
"BLOCK_TOK": 256,
29+
"num_stages": 3,
30+
"num_warps": 8
31+
},
32+
"256": {
33+
"BLOCK_TOK": 128,
34+
"num_stages": 5,
35+
"num_warps": 4
36+
},
37+
"32": {
38+
"BLOCK_TOK": 128,
39+
"num_stages": 5,
40+
"num_warps": 4
41+
},
42+
"4096": {
43+
"BLOCK_TOK": 256,
44+
"num_stages": 2,
45+
"num_warps": 8
46+
},
47+
"64": {
48+
"BLOCK_TOK": 128,
49+
"num_stages": 2,
50+
"num_warps": 4
51+
},
52+
"8": {
53+
"BLOCK_TOK": 256,
54+
"num_stages": 2,
55+
"num_warps": 4
56+
},
57+
"8448": {
58+
"BLOCK_TOK": 128,
59+
"num_stages": 4,
60+
"num_warps": 4
61+
}
62+
}

0 commit comments

Comments
 (0)