Skip to content

Commit dad541c

Browse files
author
nicunxiao
committed
new format
1 parent e448754 commit dad541c

File tree

2 files changed

+18
-6
lines changed

2 files changed

+18
-6
lines changed

src/tl_templates/cuda/gemm_mma.h

Lines changed: 9 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -257,9 +257,15 @@ struct OperandTraits<64, N, K, false, num_warp_n, leading_dim,
257257
using Copy = DefaultCopy;
258258
};
259259

260-
template<typename T> struct to_cute_type {using type = T;};
261-
template<> struct to_cute_type<tl::float_e4m3_t> {using type = cute::float_e4m3_t;};
262-
template<> struct to_cute_type<tl::float_e5m2_t> {using type = cute::float_e5m2_t;};
260+
template <typename T> struct to_cute_type {
261+
using type = T;
262+
};
263+
template <> struct to_cute_type<tl::float_e4m3_t> {
264+
using type = cute::float_e4m3_t;
265+
};
266+
template <> struct to_cute_type<tl::float_e5m2_t> {
267+
using type = cute::float_e5m2_t;
268+
};
263269

264270
template <int M, int N, int K, int num_warp_m, int num_warp_n, bool trans_A,
265271
bool trans_B, bool clear_accum, int lda, int ldb, int offset_a,

src/tl_templates/cuda/gemm_sm90.h

Lines changed: 9 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -15,9 +15,15 @@ using namespace SM90;
1515
namespace tl_wgmma {
1616

1717
using namespace cutlass::gemm::collective::detail; // ss_smem_selector
18-
template<typename T> struct to_cute_type {using type = T;};
19-
template<> struct to_cute_type<tl::float_e4m3_t> {using type = cute::float_e4m3_t;};
20-
template<> struct to_cute_type<tl::float_e5m2_t> {using type = cute::float_e5m2_t;};
18+
template <typename T> struct to_cute_type {
19+
using type = T;
20+
};
21+
template <> struct to_cute_type<tl::float_e4m3_t> {
22+
using type = cute::float_e4m3_t;
23+
};
24+
template <> struct to_cute_type<tl::float_e5m2_t> {
25+
using type = cute::float_e5m2_t;
26+
};
2127

2228
template <int M, int N, int K, int num_warp_m, int num_warp_n, bool trans_A,
2329
bool trans_B, bool clear_accum, typename A_type_raw,

0 commit comments

Comments
 (0)