[DAG] computeKnownBits - add CTLS handling by stomfaig · Pull Request #174824 · llvm/llvm-project

stomfaig · 2026-01-07T18:31:11Z

Add handling for CTLS using the same method as in #174636.

Added tests to AArch64 and RISCV, but it seems that ARM is actually resolving llvm.arm.cls to clz, so no tests were added there.

llvmbot · 2026-01-07T18:37:55Z

@llvm/pr-subscribers-backend-risc-v
@llvm/pr-subscribers-llvm-selectiondag

@llvm/pr-subscribers-backend-aarch64

Author: Gergo Stomfai (stomfaig)

Changes

Add handling for CTLS using the same method as in #174636.

Added tests to AArch64 and RISCV, but it seems that ARM is actually resolving llvm.arm.cls to clz, so no tests were added there.

Full diff: https://github.com/llvm/llvm-project/pull/174824.diff

3 Files Affected:

(modified) llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp (+8)
(modified) llvm/test/CodeGen/AArch64/cls.ll (+78)
(modified) llvm/test/CodeGen/RISCV/rv32p.ll (+65)

diff --git a/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp b/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
index 15f86cb94f958..ba130a78a1af7 100644
--- a/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp
@@ -3870,6 +3870,14 @@ KnownBits SelectionDAG::computeKnownBits(SDValue Op, const APInt &DemandedElts,
     Known.Zero.setBitsFrom(LowBits);
     break;
   }
+  case ISD::CTLS: {
+    unsigned MinRedundantSignBits =
+        ComputeNumSignBits(Op.getOperand(0), DemandedElts, Depth + 1);
+    ConstantRange Range(APInt(BitWidth, MinRedundantSignBits),
+                        APInt(BitWidth, 32));
+    Known = Range.toKnownBits();
+    break;
+  }
   case ISD::CTPOP: {
     Known2 = computeKnownBits(Op.getOperand(0), DemandedElts, Depth + 1);
     // If we know some of the bits are zero, they can't be one.
diff --git a/llvm/test/CodeGen/AArch64/cls.ll b/llvm/test/CodeGen/AArch64/cls.ll
index f17ccf7d6f682..1eb6f7411a49d 100644
--- a/llvm/test/CodeGen/AArch64/cls.ll
+++ b/llvm/test/CodeGen/AArch64/cls.ll
@@ -18,3 +18,81 @@ define i32 @cls64(i64 %t) {
 
 declare i32 @llvm.aarch64.cls(i32) nounwind
 declare i32 @llvm.aarch64.cls64(i64) nounwind
+
+define i8 @cls_i8(i8 %x) {
+; CHECK-LABEL: cls_i8:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    sxtb w8, w0 
+; CHECK-NEXT:    cls w8, w8 
+; CHECK-NEXT:    sub w0, w8, #24 
+; CHECK-NEXT:    ret
+
+  %a = ashr i8 %x, 7
+  %b = xor i8 %x, %a
+  %c = call i8 @llvm.ctlz.i8(i8 %b, i1 false)
+  %d = sub i8 %c, 1
+  ret i8 %d
+}
+
+; The result is in the range [1-31], so we don't need an andi after the cls.
+define i32 @cls_i32_knownbits(i32 %x) {
+; CHECK-LABEL: cls_i32_knownbits:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    cls	w0, w0
+; CHECK-NEXT:    ret
+  %a = ashr i32 %x, 31
+  %b = xor i32 %x, %a
+  %c = call i32 @llvm.ctlz.i32(i32 %b, i1 false)
+  %d = sub i32 %c, 1
+  %e = and i32 %d, 31
+  ret i32 %e
+}
+
+; There are at least 16 redundant sign bits so we don't need an ori after the clsw.
+define i32 @cls_i32_knownbits_2(i16 signext %x) {
+; CHECK-LABEL: cls_i32_knownbits_2:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    cls w0, w0
+; CHECK-NEXT:    ret
+  %sext = sext i16 %x to i32
+  %a = ashr i32 %sext, 31
+  %b = xor i32 %sext, %a
+  %c = call i32 @llvm.ctlz.i32(i32 %b, i1 false)
+  %d = sub i32 %c, 1
+  %e = or i32 %d, 16
+  ret i32 %e
+}
+
+; There are at least 24 redundant sign bits so we don't need an ori after the clsw.
+define i32 @cls_i32_knownbits_3(i8 signext %x) {
+; CHECK-LABEL: cls_i32_knownbits_3:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:    cls	w0, w0
+; CHECK-NEXT:    ret
+  %sext = sext i8 %x to i32
+  %a = ashr i32 %sext, 31
+  %b = xor i32 %sext, %a
+  %c = call i32 @llvm.ctlz.i32(i32 %b, i1 false)
+  %d = sub i32 %c, 1
+  %e = or i32 %d, 24
+  ret i32 %e
+}
+
+; Negative test. We only know there is at least 1 redundant sign bit. We can't
+; remove the ori.
+define i32 @cls_i32_knownbits_4(i32 signext %x) {
+; CHECK-LABEL: cls_i32_knownbits_4:
+; CHECK:       // %bb.0:
+; CHECK-NEXT:   sbfx	w8, w0, #0, #31
+; CHECK-NEXT:	  cls	w8, w8
+; CHECK-NEXT:	  orr	w0, w8, #0x1
+; CHECK-NEXT:	  ret
+  %shl = shl i32 %x, 1
+  %ashr = ashr i32 %shl, 1
+  %a = ashr i32 %ashr, 31
+  %b = xor i32 %ashr, %a
+  %c = call i32 @llvm.ctlz.i32(i32 %b, i1 false)
+  %d = sub i32 %c, 1
+  %e = or i32 %d, 1
+  ret i32 %e
+ }
diff --git a/llvm/test/CodeGen/RISCV/rv32p.ll b/llvm/test/CodeGen/RISCV/rv32p.ll
index 9faac5df2a414..9611af1ee8c0e 100644
--- a/llvm/test/CodeGen/RISCV/rv32p.ll
+++ b/llvm/test/CodeGen/RISCV/rv32p.ll
@@ -234,6 +234,71 @@ define i64 @cls_i64_2(i64 %x) {
   ret i64 %e
 }
 
+; The result is in the range [1-31], so we don't need an andi after the cls.
+define i32 @cls_i32_knownbits(i32 %x) {
+; CHECK-LABEL: cls_i32_knownbits:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    cls	a0, a0
+; CHECK-NEXT:    ret
+  %a = ashr i32 %x, 31
+  %b = xor i32 %x, %a
+  %c = call i32 @llvm.ctlz.i32(i32 %b, i1 false)
+  %d = sub i32 %c, 1
+  %e = and i32 %d, 31
+  ret i32 %e
+}
+
+; There are at least 16 redundant sign bits so we don't need an ori after the clsw.
+define i32 @cls_i32_knownbits_2(i16 signext %x) {
+; CHECK-LABEL: cls_i32_knownbits_2:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    cls a0, a0
+; CHECK-NEXT:    ret
+  %sext = sext i16 %x to i32
+  %a = ashr i32 %sext, 31
+  %b = xor i32 %sext, %a
+  %c = call i32 @llvm.ctlz.i32(i32 %b, i1 false)
+  %d = sub i32 %c, 1
+  %e = or i32 %d, 16
+  ret i32 %e
+}
+
+; There are at least 24 redundant sign bits so we don't need an ori after the clsw.
+define i32 @cls_i32_knownbits_3(i8 signext %x) {
+; CHECK-LABEL: cls_i32_knownbits_3:
+; CHECK:       # %bb.0:
+; CHECK-NEXT:    cls	a0, a0
+; CHECK-NEXT:    ret
+  %sext = sext i8 %x to i32
+  %a = ashr i32 %sext, 31
+  %b = xor i32 %sext, %a
+  %c = call i32 @llvm.ctlz.i32(i32 %b, i1 false)
+  %d = sub i32 %c, 1
+  %e = or i32 %d, 24
+  ret i32 %e
+}
+
+; Negative test. We only know there is at least 1 redundant sign bit. We can't
+; remove the ori.
+define i32 @cls_i32_knownbits_4(i32 signext %x) {
+; CHECK-LABEL: cls_i32_knownbits_4:
+; CHECK:       # %bb.0:
+; CHECK-NEXT: slli a0, a0, 1
+; CHECK-NEXT: srai a0, a0, 1
+; CHECK-NEXT: cls a0, a0 
+; CHECK-NEXT: ori a0, a0, 1 
+; CHECK-NEXT: ret 
+  %shl = shl i32 %x, 1
+  %ashr = ashr i32 %shl, 1
+  %a = ashr i32 %ashr, 31
+  %b = xor i32 %ashr, %a
+  %c = call i32 @llvm.ctlz.i32(i32 %b, i1 false)
+  %d = sub i32 %c, 1
+  %e = or i32 %d, 1
+  ret i32 %e
+ }
+ 
+
 define i64 @slx_i64(i64 %x, i64 %y) {
 ; CHECK-LABEL: slx_i64:
 ; CHECK:       # %bb.0:

llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp

github-actions · 2026-01-07T19:20:40Z

🐧 Linux x64 Test Results

188403 tests passed
5000 tests skipped

✅ The build succeeded and all tests passed.

topperc · 2026-01-07T22:36:04Z

Please add additional tests that would have caught the bugs.

github-actions · 2026-01-08T09:25:34Z

🪟 Windows x64 Test Results

129384 tests passed
2862 tests skipped

✅ The build succeeded and all tests passed.

llvm/test/CodeGen/RISCV/rv32p.ll

topperc

LGTM

Noticed when reviewing llvm#174824

Noticed when reviewing #174824

RKSimon

LGTM

Noticed when reviewing llvm#174824

Add handling for CTLS using the same method as in llvm#174636. Added tests to AArch64 and RISCV, but it seems that ARM is actually resolving `llvm.arm.cls` to `clz`, so no tests were added there.

Noticed when reviewing llvm#174824

Add handling for CTLS using the same method as in llvm#174636. Added tests to AArch64 and RISCV, but it seems that ARM is actually resolving `llvm.arm.cls` to `clz`, so no tests were added there.

stomfaig added 3 commits January 7, 2026 18:23

add handling CTLS in DAG

195c522

add tests

7b4c9e9

recover docstrings

e87003b

stomfaig changed the title ~~[DAG][GISel] computeKnownBits - add CTLS handling~~ [DAG] computeKnownBits - add CTLS handling Jan 7, 2026

llvmbot added the backend:AArch64, backend:RISC-V, and llvm:SelectionDAG (SelectionDAGISel as well) labels Jan 7, 2026

topperc self-requested a review January 7, 2026 18:57

topperc reviewed Jan 7, 2026

View reviewed changes

llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp Outdated Show resolved Hide resolved

llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp Outdated Show resolved Hide resolved

correct left-in test logic and ctls semantics

5b83242

topperc requested a review from RKSimon January 7, 2026 22:36

fixed knownbits range max and knownbits overestimation test

2183625

fix tests

458d7cd

topperc reviewed Jan 12, 2026

View reviewed changes

llvm/test/CodeGen/RISCV/rv32p.ll Outdated Show resolved Hide resolved

stomfaig added 2 commits January 13, 2026 17:29

regen tests with update_llc_test_checks

cc207cc

remove unrelated change

5a71a9d

topperc approved these changes Jan 13, 2026

View reviewed changes

RKSimon mentioned this pull request Jan 14, 2026

[DAG][GISel] computeKnownBits - add CTLS handling #174370

Closed

RKSimon added a commit to RKSimon/llvm-project that referenced this pull request Jan 14, 2026

[AArch64] cls.ll - regenerate test checks

d0ec61e

Noticed when reviewing llvm#174824

RKSimon mentioned this pull request Jan 14, 2026

[AArch64] cls.ll - regenerate test checks #175948

Merged

RKSimon added a commit that referenced this pull request Jan 14, 2026

[AArch64] cls.ll - regenerate test checks (#175948)

d363c7f

Noticed when reviewing #174824

Merge branch 'main' into issue_174370

56c4f11

RKSimon approved these changes Jan 14, 2026

View reviewed changes

RKSimon enabled auto-merge (squash) January 14, 2026 14:30

RKSimon merged commit 5f31b9c into llvm:main Jan 14, 2026
10 of 11 checks passed

Priyanshu3820 pushed a commit to Priyanshu3820/llvm-project that referenced this pull request Jan 18, 2026

[AArch64] cls.ll - regenerate test checks (llvm#175948)

94f8e15

Noticed when reviewing llvm#174824

BStott6 pushed a commit to BStott6/llvm-project that referenced this pull request Jan 22, 2026

[AArch64] cls.ll - regenerate test checks (llvm#175948)

3cc755e

Noticed when reviewing llvm#174824

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

[DAG] computeKnownBits - add CTLS handling #174824

[DAG] computeKnownBits - add CTLS handling #174824
RKSimon merged 9 commits into llvm:main from stomfaig:issue_174370

stomfaig commented Jan 7, 2026

Uh oh!

llvmbot commented Jan 7, 2026 •

edited

Loading

Uh oh!

Uh oh!

Uh oh!

github-actions bot commented Jan 7, 2026 •

edited

Loading

Uh oh!

topperc commented Jan 7, 2026

Uh oh!

github-actions bot commented Jan 8, 2026 •

edited

Loading

Uh oh!

Uh oh!

topperc left a comment

Uh oh!

RKSimon left a comment

Uh oh!

Uh oh!

Reviewers

Assignees

Labels

Projects

Milestone

Development

Uh oh!

4 participants

Conversation

stomfaig commented Jan 7, 2026

Uh oh!

llvmbot commented Jan 7, 2026 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Uh oh!

Uh oh!

Uh oh!

github-actions bot commented Jan 7, 2026 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

🐧 Linux x64 Test Results

Uh oh!

topperc commented Jan 7, 2026

Uh oh!

github-actions bot commented Jan 8, 2026 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

🪟 Windows x64 Test Results

Uh oh!

Uh oh!

topperc left a comment

Choose a reason for hiding this comment

Uh oh!

RKSimon left a comment

Choose a reason for hiding this comment

Uh oh!

Uh oh!

Reviewers

Assignees

Labels

Projects

Milestone

Development

Uh oh!

4 participants

llvmbot commented Jan 7, 2026 •

edited

Loading

github-actions bot commented Jan 7, 2026 •

edited

Loading

github-actions bot commented Jan 8, 2026 •

edited

Loading