File tree Expand file tree Collapse file tree 1 file changed +164
-0
lines changed
vllm/model_executor/layers/fused_moe/configs Expand file tree Collapse file tree 1 file changed +164
-0
lines changed Original file line number Diff line number Diff line change 1+ {
2+ "1" : {
3+ "BLOCK_SIZE_M" : 16 ,
4+ "BLOCK_SIZE_N" : 128 ,
5+ "BLOCK_SIZE_K" : 256 ,
6+ "GROUP_SIZE_M" : 1 ,
7+ "num_warps" : 8 ,
8+ "num_stages" : 2 ,
9+ "waves_per_eu" : 0
10+ },
11+ "2" : {
12+ "BLOCK_SIZE_M" : 16 ,
13+ "BLOCK_SIZE_N" : 128 ,
14+ "BLOCK_SIZE_K" : 128 ,
15+ "GROUP_SIZE_M" : 1 ,
16+ "num_warps" : 8 ,
17+ "num_stages" : 2 ,
18+ "waves_per_eu" : 0
19+ },
20+ "4" : {
21+ "BLOCK_SIZE_M" : 16 ,
22+ "BLOCK_SIZE_N" : 128 ,
23+ "BLOCK_SIZE_K" : 128 ,
24+ "GROUP_SIZE_M" : 1 ,
25+ "num_warps" : 8 ,
26+ "num_stages" : 2 ,
27+ "waves_per_eu" : 0
28+ },
29+ "8" : {
30+ "BLOCK_SIZE_M" : 16 ,
31+ "BLOCK_SIZE_N" : 128 ,
32+ "BLOCK_SIZE_K" : 128 ,
33+ "GROUP_SIZE_M" : 1 ,
34+ "num_warps" : 8 ,
35+ "num_stages" : 2 ,
36+ "waves_per_eu" : 0
37+ },
38+ "16" : {
39+ "BLOCK_SIZE_M" : 16 ,
40+ "BLOCK_SIZE_N" : 128 ,
41+ "BLOCK_SIZE_K" : 128 ,
42+ "GROUP_SIZE_M" : 4 ,
43+ "num_warps" : 8 ,
44+ "num_stages" : 2 ,
45+ "waves_per_eu" : 0
46+ },
47+ "24" : {
48+ "BLOCK_SIZE_M" : 16 ,
49+ "BLOCK_SIZE_N" : 128 ,
50+ "BLOCK_SIZE_K" : 128 ,
51+ "GROUP_SIZE_M" : 1 ,
52+ "num_warps" : 8 ,
53+ "num_stages" : 2 ,
54+ "waves_per_eu" : 0
55+ },
56+ "32" : {
57+ "BLOCK_SIZE_M" : 16 ,
58+ "BLOCK_SIZE_N" : 128 ,
59+ "BLOCK_SIZE_K" : 256 ,
60+ "GROUP_SIZE_M" : 8 ,
61+ "num_warps" : 8 ,
62+ "num_stages" : 2 ,
63+ "waves_per_eu" : 0
64+ },
65+ "48" : {
66+ "BLOCK_SIZE_M" : 16 ,
67+ "BLOCK_SIZE_N" : 128 ,
68+ "BLOCK_SIZE_K" : 256 ,
69+ "GROUP_SIZE_M" : 1 ,
70+ "num_warps" : 8 ,
71+ "num_stages" : 2 ,
72+ "waves_per_eu" : 0
73+ },
74+ "64" : {
75+ "BLOCK_SIZE_M" : 16 ,
76+ "BLOCK_SIZE_N" : 128 ,
77+ "BLOCK_SIZE_K" : 128 ,
78+ "GROUP_SIZE_M" : 1 ,
79+ "num_warps" : 8 ,
80+ "num_stages" : 2 ,
81+ "waves_per_eu" : 0
82+ },
83+ "96" : {
84+ "BLOCK_SIZE_M" : 16 ,
85+ "BLOCK_SIZE_N" : 128 ,
86+ "BLOCK_SIZE_K" : 256 ,
87+ "GROUP_SIZE_M" : 8 ,
88+ "num_warps" : 8 ,
89+ "num_stages" : 2 ,
90+ "waves_per_eu" : 0
91+ },
92+ "128" : {
93+ "BLOCK_SIZE_M" : 16 ,
94+ "BLOCK_SIZE_N" : 128 ,
95+ "BLOCK_SIZE_K" : 128 ,
96+ "GROUP_SIZE_M" : 1 ,
97+ "num_warps" : 8 ,
98+ "num_stages" : 2 ,
99+ "waves_per_eu" : 0
100+ },
101+ "256" : {
102+ "BLOCK_SIZE_M" : 32 ,
103+ "BLOCK_SIZE_N" : 128 ,
104+ "BLOCK_SIZE_K" : 256 ,
105+ "GROUP_SIZE_M" : 1 ,
106+ "num_warps" : 4 ,
107+ "num_stages" : 2 ,
108+ "waves_per_eu" : 0
109+ },
110+ "512" : {
111+ "BLOCK_SIZE_M" : 64 ,
112+ "BLOCK_SIZE_N" : 128 ,
113+ "BLOCK_SIZE_K" : 128 ,
114+ "GROUP_SIZE_M" : 4 ,
115+ "num_warps" : 8 ,
116+ "num_stages" : 2 ,
117+ "waves_per_eu" : 0
118+ },
119+ "1024" : {
120+ "BLOCK_SIZE_M" : 128 ,
121+ "BLOCK_SIZE_N" : 128 ,
122+ "BLOCK_SIZE_K" : 256 ,
123+ "GROUP_SIZE_M" : 1 ,
124+ "num_warps" : 8 ,
125+ "num_stages" : 2 ,
126+ "waves_per_eu" : 0
127+ },
128+ "1536" : {
129+ "BLOCK_SIZE_M" : 128 ,
130+ "BLOCK_SIZE_N" : 128 ,
131+ "BLOCK_SIZE_K" : 256 ,
132+ "GROUP_SIZE_M" : 4 ,
133+ "num_warps" : 8 ,
134+ "num_stages" : 2 ,
135+ "waves_per_eu" : 0
136+ },
137+ "2048" : {
138+ "BLOCK_SIZE_M" : 128 ,
139+ "BLOCK_SIZE_N" : 128 ,
140+ "BLOCK_SIZE_K" : 128 ,
141+ "GROUP_SIZE_M" : 4 ,
142+ "num_warps" : 8 ,
143+ "num_stages" : 2 ,
144+ "waves_per_eu" : 0
145+ },
146+ "3072" : {
147+ "BLOCK_SIZE_M" : 128 ,
148+ "BLOCK_SIZE_N" : 128 ,
149+ "BLOCK_SIZE_K" : 256 ,
150+ "GROUP_SIZE_M" : 1 ,
151+ "num_warps" : 8 ,
152+ "num_stages" : 2 ,
153+ "waves_per_eu" : 0
154+ },
155+ "4096" : {
156+ "BLOCK_SIZE_M" : 128 ,
157+ "BLOCK_SIZE_N" : 128 ,
158+ "BLOCK_SIZE_K" : 256 ,
159+ "GROUP_SIZE_M" : 1 ,
160+ "num_warps" : 8 ,
161+ "num_stages" : 2 ,
162+ "waves_per_eu" : 0
163+ }
164+ }
You can’t perform that action at this time.
0 commit comments