File tree 1 file changed +164
-0
lines changed
vllm/model_executor/layers/fused_moe/configs
1 file changed +164
-0
lines changed Original file line number Diff line number Diff line change
1
+ {
2
+ "1" : {
3
+ "BLOCK_SIZE_M" : 16 ,
4
+ "BLOCK_SIZE_N" : 128 ,
5
+ "BLOCK_SIZE_K" : 256 ,
6
+ "GROUP_SIZE_M" : 1 ,
7
+ "num_warps" : 8 ,
8
+ "num_stages" : 2 ,
9
+ "waves_per_eu" : 0
10
+ },
11
+ "2" : {
12
+ "BLOCK_SIZE_M" : 16 ,
13
+ "BLOCK_SIZE_N" : 128 ,
14
+ "BLOCK_SIZE_K" : 256 ,
15
+ "GROUP_SIZE_M" : 1 ,
16
+ "num_warps" : 8 ,
17
+ "num_stages" : 2 ,
18
+ "waves_per_eu" : 0
19
+ },
20
+ "4" : {
21
+ "BLOCK_SIZE_M" : 16 ,
22
+ "BLOCK_SIZE_N" : 128 ,
23
+ "BLOCK_SIZE_K" : 256 ,
24
+ "GROUP_SIZE_M" : 1 ,
25
+ "num_warps" : 8 ,
26
+ "num_stages" : 2 ,
27
+ "waves_per_eu" : 0
28
+ },
29
+ "8" : {
30
+ "BLOCK_SIZE_M" : 16 ,
31
+ "BLOCK_SIZE_N" : 128 ,
32
+ "BLOCK_SIZE_K" : 128 ,
33
+ "GROUP_SIZE_M" : 1 ,
34
+ "num_warps" : 8 ,
35
+ "num_stages" : 2 ,
36
+ "waves_per_eu" : 0
37
+ },
38
+ "16" : {
39
+ "BLOCK_SIZE_M" : 16 ,
40
+ "BLOCK_SIZE_N" : 128 ,
41
+ "BLOCK_SIZE_K" : 128 ,
42
+ "GROUP_SIZE_M" : 1 ,
43
+ "num_warps" : 8 ,
44
+ "num_stages" : 2 ,
45
+ "waves_per_eu" : 0
46
+ },
47
+ "24" : {
48
+ "BLOCK_SIZE_M" : 16 ,
49
+ "BLOCK_SIZE_N" : 128 ,
50
+ "BLOCK_SIZE_K" : 128 ,
51
+ "GROUP_SIZE_M" : 1 ,
52
+ "num_warps" : 4 ,
53
+ "num_stages" : 2 ,
54
+ "waves_per_eu" : 0
55
+ },
56
+ "32" : {
57
+ "BLOCK_SIZE_M" : 16 ,
58
+ "BLOCK_SIZE_N" : 128 ,
59
+ "BLOCK_SIZE_K" : 256 ,
60
+ "GROUP_SIZE_M" : 1 ,
61
+ "num_warps" : 4 ,
62
+ "num_stages" : 2 ,
63
+ "waves_per_eu" : 0
64
+ },
65
+ "48" : {
66
+ "BLOCK_SIZE_M" : 16 ,
67
+ "BLOCK_SIZE_N" : 128 ,
68
+ "BLOCK_SIZE_K" : 128 ,
69
+ "GROUP_SIZE_M" : 1 ,
70
+ "num_warps" : 8 ,
71
+ "num_stages" : 2 ,
72
+ "waves_per_eu" : 0
73
+ },
74
+ "64" : {
75
+ "BLOCK_SIZE_M" : 16 ,
76
+ "BLOCK_SIZE_N" : 128 ,
77
+ "BLOCK_SIZE_K" : 256 ,
78
+ "GROUP_SIZE_M" : 4 ,
79
+ "num_warps" : 8 ,
80
+ "num_stages" : 2 ,
81
+ "waves_per_eu" : 0
82
+ },
83
+ "96" : {
84
+ "BLOCK_SIZE_M" : 16 ,
85
+ "BLOCK_SIZE_N" : 128 ,
86
+ "BLOCK_SIZE_K" : 128 ,
87
+ "GROUP_SIZE_M" : 1 ,
88
+ "num_warps" : 8 ,
89
+ "num_stages" : 2 ,
90
+ "waves_per_eu" : 0
91
+ },
92
+ "128" : {
93
+ "BLOCK_SIZE_M" : 16 ,
94
+ "BLOCK_SIZE_N" : 128 ,
95
+ "BLOCK_SIZE_K" : 256 ,
96
+ "GROUP_SIZE_M" : 1 ,
97
+ "num_warps" : 8 ,
98
+ "num_stages" : 2 ,
99
+ "waves_per_eu" : 0
100
+ },
101
+ "256" : {
102
+ "BLOCK_SIZE_M" : 32 ,
103
+ "BLOCK_SIZE_N" : 128 ,
104
+ "BLOCK_SIZE_K" : 128 ,
105
+ "GROUP_SIZE_M" : 1 ,
106
+ "num_warps" : 4 ,
107
+ "num_stages" : 2 ,
108
+ "waves_per_eu" : 0
109
+ },
110
+ "512" : {
111
+ "BLOCK_SIZE_M" : 64 ,
112
+ "BLOCK_SIZE_N" : 128 ,
113
+ "BLOCK_SIZE_K" : 128 ,
114
+ "GROUP_SIZE_M" : 8 ,
115
+ "num_warps" : 8 ,
116
+ "num_stages" : 2 ,
117
+ "waves_per_eu" : 0
118
+ },
119
+ "1024" : {
120
+ "BLOCK_SIZE_M" : 128 ,
121
+ "BLOCK_SIZE_N" : 128 ,
122
+ "BLOCK_SIZE_K" : 128 ,
123
+ "GROUP_SIZE_M" : 8 ,
124
+ "num_warps" : 8 ,
125
+ "num_stages" : 2 ,
126
+ "waves_per_eu" : 0
127
+ },
128
+ "1536" : {
129
+ "BLOCK_SIZE_M" : 128 ,
130
+ "BLOCK_SIZE_N" : 128 ,
131
+ "BLOCK_SIZE_K" : 128 ,
132
+ "GROUP_SIZE_M" : 8 ,
133
+ "num_warps" : 8 ,
134
+ "num_stages" : 2 ,
135
+ "waves_per_eu" : 0
136
+ },
137
+ "2048" : {
138
+ "BLOCK_SIZE_M" : 128 ,
139
+ "BLOCK_SIZE_N" : 128 ,
140
+ "BLOCK_SIZE_K" : 128 ,
141
+ "GROUP_SIZE_M" : 4 ,
142
+ "num_warps" : 8 ,
143
+ "num_stages" : 2 ,
144
+ "waves_per_eu" : 0
145
+ },
146
+ "3072" : {
147
+ "BLOCK_SIZE_M" : 128 ,
148
+ "BLOCK_SIZE_N" : 128 ,
149
+ "BLOCK_SIZE_K" : 256 ,
150
+ "GROUP_SIZE_M" : 1 ,
151
+ "num_warps" : 8 ,
152
+ "num_stages" : 2 ,
153
+ "waves_per_eu" : 0
154
+ },
155
+ "4096" : {
156
+ "BLOCK_SIZE_M" : 128 ,
157
+ "BLOCK_SIZE_N" : 128 ,
158
+ "BLOCK_SIZE_K" : 256 ,
159
+ "GROUP_SIZE_M" : 4 ,
160
+ "num_warps" : 8 ,
161
+ "num_stages" : 2 ,
162
+ "waves_per_eu" : 0
163
+ }
164
+ }
You can’t perform that action at this time.
0 commit comments