Skip to content
Merged
Show file tree
Hide file tree
Changes from 3 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion 3rdparty/cutlass
Submodule cutlass updated 175 files
Original file line number Diff line number Diff line change
Expand Up @@ -138,22 +138,23 @@ void dispatchMoeGemmFinalDispatchTmaWarpSpecialized(TmaWarpSpecializedGroupedGem
TLLM_THROW("Please recompile with support for hopper by passing 90-real as an arch to build_wheel.py.");
}
#endif
// #ifndef COMPILE_BLACKWELL_SM103_TMA_GROUPED_GEMMS
#ifndef COMPILE_BLACKWELL_SM103_TMA_GROUPED_GEMMS
else if constexpr (Arch::kMinComputeCapability == 103)
{
static std::once_flag flag;
std::call_once(flag,
[]()
{
TLLM_LOG_WARNING(
"Falling back to sm100f version due to a bug in cutlass." /*"For best performance please recompile with support for blackwell by "
"passing 103-real as an arch to build_wheel.py."*/);
"For best performance please recompile with support for blackwell by "
"passing 103-real as an arch to build_wheel.py.");
});
return dispatchMoeGemmFinalDispatchTmaWarpSpecialized<cutlass::arch::Sm100, T, WeightType, OutputType,
EpilogueTag, FUSION, TileShape, ClusterShape>(
dispatchMoeGemmFinalDispatchTmaWarpSpecialized<cutlass::arch::Sm100, T, WeightType, OutputType, EpilogueTag,
FUSION, TileShape, ClusterShape>(
hopper_input, num_experts, gemm_config, multi_processor_count, stream, occupancy, workspace_size);
return;
}
// #endif
#endif
#ifndef COMPILE_BLACKWELL_TMA_GROUPED_GEMMS
else if constexpr (Arch::kMinComputeCapability >= 100 && Arch::kMinComputeCapability < 120)
{
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -3,19 +3,6 @@
import os
from itertools import chain, product

file_to_patch = os.path.abspath(
os.path.join(
os.path.dirname(__file__),
"../../../../../3rdparty/cutlass/python/cutlass_library/heuristics_provider.py"
))
# replace "from library import" to "from cutlass_library.library import"
with open(file_to_patch, "r") as f:
file_contents = f.read()
with open(file_to_patch, "w") as f:
f.write(
file_contents.replace("from library import",
"from cutlass_library.library import"))

from cutlass_library import *


Expand Down
Loading