We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0760ab0, commit c796f47 (Copy full SHA for c796f47)
src/runtime/contrib/cutlass/weight_preprocess.cc
@@ -39,7 +39,7 @@ namespace runtime {
39
TVM_REGISTER_GLOBAL("cutlass.ft_preprocess_weight")
40
.set_body_typed([](NDArray packed_weight, int sm, bool is_int4) {
41
bool is_2d = packed_weight->ndim == 2;
42
- int num_experts = 1;
+ int num_experts = is_2d ? 1 : packed_weight->shape[0];
43
int rows = packed_weight->shape[is_2d ? 0 : 1];
44
int cols = packed_weight->shape[is_2d ? 1 : 2];
45
0 commit comments