1 file changed: +4 -0 lines changed
include/flashinfer/trtllm/fmha: 1 file changed, +4 -0 lines changed
Columns: original file line number, diff line number, diff line change
@@ -152,6 +152,8 @@ struct KernelParams {
152152 int32_t mStartTokenIdxSfO ;
153153 // The sum of sequence lengths for Q and K/V.
154154 int32_t mSumOfSeqLensQ , mSumOfSeqLensKv ;
155+ // The flag to use block sparse attention.
156+ bool mUseBlockSparseAttention ;
155157
156158 // Create the TMA shape/stride for Q.
157159 template <class FmhaOptions >
@@ -699,6 +701,8 @@ struct KernelParams {
699701 params.mStartTokenIdxSfO = options.mSfStartTokenIdx ;
700702 params.mScaleSfKv = options.mScaleSfKv ;
701703 params.ptrSoftmaxStats = options.softmaxStatsPtr ;
704+ // TODO: Integrate trtllm block-sparse attention kernels when needed.
705+ params.mUseBlockSparseAttention = false ;
702706 return params;
703707 }
704708};
You can’t perform that action at this time.
0 commit comments