diff --git a/third_party/amd/lib/TritonAMDGPUToLLVM/MemoryOpToLLVM.cpp b/third_party/amd/lib/TritonAMDGPUToLLVM/MemoryOpToLLVM.cpp index 78226c707886..323900cf9df6 100644 --- a/third_party/amd/lib/TritonAMDGPUToLLVM/MemoryOpToLLVM.cpp +++ b/third_party/amd/lib/TritonAMDGPUToLLVM/MemoryOpToLLVM.cpp @@ -187,7 +187,7 @@ class TransLocalLoadOpConversion // If we are lowering a subslice, the subslice offsets shall not touch the // contiguous part of the tile - if (maskSpanAffineOffset & (tile.getOutDimSizeLog2(kOffset) - 1)) { + if (maskSpanAffineOffset & (tile.getOutDimSize(kOffset) - 1)) { return failure(); } diff --git a/third_party/nvidia/lib/TritonNVIDIAGPUToLLVM/Utility.cpp b/third_party/nvidia/lib/TritonNVIDIAGPUToLLVM/Utility.cpp index c2aff0a770b0..5571af976b91 100644 --- a/third_party/nvidia/lib/TritonNVIDIAGPUToLLVM/Utility.cpp +++ b/third_party/nvidia/lib/TritonNVIDIAGPUToLLVM/Utility.cpp @@ -332,7 +332,7 @@ LogicalResult lowerLdStMatrix( // If we are lowering a subslice, the subslice offsets shall not touch the // contiguous part of the tile - if (maskSpanAffineOffset & (tile.getOutDimSizeLog2(kOffset) - 1)) { + if (maskSpanAffineOffset & (tile.getOutDimSize(kOffset) - 1)) { return failure(); }