We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 521fe01 commit 51812f1Copy full SHA for 51812f1
csrc/fused_moe/moeTopKFuncs.cuh
@@ -23,14 +23,14 @@
23
24
#include <cub/cub.cuh>
25
26
-#include "tensorrt_llm/kernels/archCondition.h"
+#include "flashinfer/arch_condition.h"
27
28
namespace tensorrt_llm::kernels {
29
30
namespace reduce_topk {
31
namespace cg = cooperative_groups;
32
static constexpr int kWARP_SIZE = 32;
33
-static constexpr bool kTLLM_GEN_HAS_FAST_REDUX = tensorrt_llm::kernels::arch::is_major_v<10>;
+static constexpr bool kTLLM_GEN_HAS_FAST_REDUX = flashinfer::arch::is_major_v<10>;
34
35
template <typename T_>
36
struct TopKRedType {
csrc/nv_internal/tensorrt_llm/kernels/archCondition.h
0 commit comments