Skip to content

Commit cc1d2cc

Browse files
committed
Thor's __CUDA_ARCH__ is 1010, not 1100
1 parent 43a0d3a commit cc1d2cc

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

csrc/xqa/mha.cu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -93,7 +93,7 @@ __constant__ constexpr uint32_t cacheVTileSeqLen = 32;
9393
constexpr uint32_t preferedKHeadPartBytes = 64;
9494
__constant__ constexpr uint32_t cacheVTileSeqLen = 32;
9595
#elif __CUDA_ARCH__ == 800 || __CUDA_ARCH__ == 870 || __CUDA_ARCH__ == 900 || \
96-
__CUDA_ARCH__ == 1000 || __CUDA_ARCH__ == 1030 || __CUDA_ARCH__ == 1100
96+
__CUDA_ARCH__ == 1000 || __CUDA_ARCH__ == 1030 || __CUDA_ARCH__ == 1010
9797
constexpr uint32_t preferedKHeadPartBytes = 128;
9898
__constant__ constexpr uint32_t cacheVTileSeqLen = 64;
9999
#else

csrc/xqa/utils.cuh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -47,7 +47,7 @@ constexpr uint32_t kMAX_SMEM_SIZE = (99u << 10);
4747
#elif __CUDA_ARCH__ == 800 || __CUDA_ARCH__ == 870
4848
constexpr uint32_t kMAX_SMEM_SIZE = (163u << 10);
4949
#elif __CUDA_ARCH__ == 900 || __CUDA_ARCH__ == 1000 || __CUDA_ARCH__ == 1030 || \
50-
__CUDA_ARCH__ == 1100
50+
__CUDA_ARCH__ == 1010
5151
constexpr uint32_t kMAX_SMEM_SIZE = (227u << 10);
5252
#endif
5353
#endif

0 commit comments

Comments
 (0)