From 472d3271e68b56489ee5cff6f610fbc122e7631d Mon Sep 17 00:00:00 2001
From: RxZ
Date: Thu, 22 Jan 2026 11:24:36 +0800
Subject: [PATCH] chunk_gated_delta_rule_npu output final state

---
 python/sgl_kernel_npu/sgl_kernel_npu/fla/chunk.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/sgl_kernel_npu/sgl_kernel_npu/fla/chunk.py b/python/sgl_kernel_npu/sgl_kernel_npu/fla/chunk.py
index b7d50b673..220bfcc2e 100644
--- a/python/sgl_kernel_npu/sgl_kernel_npu/fla/chunk.py
+++ b/python/sgl_kernel_npu/sgl_kernel_npu/fla/chunk.py
@@ -234,7 +234,7 @@ def chunk_gated_delta_rule_npu(
     beta: torch.Tensor,
     scale: float = None,
     initial_state: torch.Tensor = None,
-    output_final_state: bool = False,
+    output_final_state: bool = True,
     cu_seqlens: Optional[torch.LongTensor] = None,
     head_first: bool = False,
     use_qk_l2norm_in_kernel: bool = False,