[DAGCombiner] Fix the "subtraction if above a constant threshold" miscompile #140042

pfusik · May 15, 2025

This fixes #135194 incorrectly reusing the existing add nuw/nsw
while the transformed code relies on an unsigned wrap.

llvmbot · May 15, 2025

@llvm/pr-subscribers-llvm-selectiondag

Author: Piotr Fusik (pfusik)

Changes

This fixes #135194 incorrectly leaving add nuw/nsw while an unsigned wrap is expected.

Full diff: https://github.com/llvm/llvm-project/pull/140042.diff

3 Files Affected:

(modified) llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp (+8-4)
(modified) llvm/test/CodeGen/RISCV/rv32zbb.ll (+26-5)
(modified) llvm/test/CodeGen/RISCV/rv64zbb.ll (+6-6)

diff --git a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
index d6e288a59b2ee..fc7295c0bc1db 100644
--- a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
@@ -12136,15 +12136,19 @@ SDValue DAGCombiner::visitSELECT(SDNode *N) {
     if (SDValue NewSel = SimplifySelect(DL, N0, N1, N2))
       return NewSel;
 
-    // (select (ugt x, C), (add x, ~C), x) -> (umin (add x, ~C), x)
+    // (select (ugt x, C), (add x, ~C), x) -> (umin x, (add x, ~C))
     // (select (ult x, C), x, (add x, -C)) -> (umin x, (add x, -C))
     APInt C;
     if (sd_match(Cond1, m_ConstInt(C)) && hasUMin(VT)) {
+      APInt AddC;
       if ((CC == ISD::SETUGT && Cond0 == N2 &&
-           sd_match(N1, m_Add(m_Specific(N2), m_SpecificInt(~C)))) ||
+           sd_match(N1, m_Add(m_Specific(N2), m_ConstInt(AddC))) &&
+           AddC == ~C) ||
           (CC == ISD::SETULT && Cond0 == N1 &&
-           sd_match(N2, m_Add(m_Specific(N1), m_SpecificInt(-C)))))
-        return DAG.getNode(ISD::UMIN, DL, VT, N1, N2);
+           sd_match(N2, m_Add(m_Specific(N1), m_ConstInt(AddC))) && AddC == -C))
+        return DAG.getNode(ISD::UMIN, DL, VT, Cond0,
+                           DAG.getNode(ISD::ADD, DL, VT, Cond0,
+                                       DAG.getConstant(AddC, DL, VT)));
     }
   }
 
diff --git a/llvm/test/CodeGen/RISCV/rv32zbb.ll b/llvm/test/CodeGen/RISCV/rv32zbb.ll
index 0f2284637ca6a..0a3729b3de6b6 100644
--- a/llvm/test/CodeGen/RISCV/rv32zbb.ll
+++ b/llvm/test/CodeGen/RISCV/rv32zbb.ll
@@ -1742,7 +1742,7 @@ define i8 @sub_if_uge_C_i8(i8 zeroext %x) {
 ; RV32ZBB:       # %bb.0:
 ; RV32ZBB-NEXT:    addi a1, a0, -13
 ; RV32ZBB-NEXT:    zext.b a1, a1
-; RV32ZBB-NEXT:    minu a0, a1, a0
+; RV32ZBB-NEXT:    minu a0, a0, a1
 ; RV32ZBB-NEXT:    ret
   %cmp = icmp ugt i8 %x, 12
   %sub = add i8 %x, -13
@@ -1763,7 +1763,7 @@ define i16 @sub_if_uge_C_i16(i16 zeroext %x) {
 ; RV32ZBB:       # %bb.0:
 ; RV32ZBB-NEXT:    addi a1, a0, -251
 ; RV32ZBB-NEXT:    zext.h a1, a1
-; RV32ZBB-NEXT:    minu a0, a1, a0
+; RV32ZBB-NEXT:    minu a0, a0, a1
 ; RV32ZBB-NEXT:    ret
   %cmp = icmp ugt i16 %x, 250
   %sub = add i16 %x, -251
@@ -1789,7 +1789,7 @@ define i32 @sub_if_uge_C_i32(i32 signext %x) {
 ; RV32ZBB-NEXT:    lui a1, 1048560
 ; RV32ZBB-NEXT:    addi a1, a1, 15
 ; RV32ZBB-NEXT:    add a1, a0, a1
-; RV32ZBB-NEXT:    minu a0, a1, a0
+; RV32ZBB-NEXT:    minu a0, a0, a1
 ; RV32ZBB-NEXT:    ret
   %cmp = icmp ugt i32 %x, 65520
   %sub = add i32 %x, -65521
@@ -1850,7 +1850,7 @@ define i32 @sub_if_uge_C_multiuse_cmp_i32(i32 signext %x, ptr %z) {
 ; RV32ZBB-NEXT:    addi a3, a3, 15
 ; RV32ZBB-NEXT:    sltu a2, a2, a0
 ; RV32ZBB-NEXT:    add a3, a0, a3
-; RV32ZBB-NEXT:    minu a0, a3, a0
+; RV32ZBB-NEXT:    minu a0, a0, a3
 ; RV32ZBB-NEXT:    sw a2, 0(a1)
 ; RV32ZBB-NEXT:    ret
   %cmp = icmp ugt i32 %x, 65520
@@ -1882,7 +1882,7 @@ define i32 @sub_if_uge_C_multiuse_sub_i32(i32 signext %x, ptr %z) {
 ; RV32ZBB-NEXT:    lui a2, 1048560
 ; RV32ZBB-NEXT:    addi a2, a2, 15
 ; RV32ZBB-NEXT:    add a2, a0, a2
-; RV32ZBB-NEXT:    minu a0, a2, a0
+; RV32ZBB-NEXT:    minu a0, a0, a2
 ; RV32ZBB-NEXT:    sw a2, 0(a1)
 ; RV32ZBB-NEXT:    ret
   %sub = add i32 %x, -65521
@@ -1917,3 +1917,24 @@ define i32 @sub_if_uge_C_swapped_i32(i32 %x) {
   %cond = select i1 %cmp, i32 %x, i32 %sub
   ret i32 %cond
 }
+
+define noundef i8 @sub_if_uge_C_nsw_i8(i8 zeroext %x) {
+; RV32I-LABEL: sub_if_uge_C_nsw_i8:
+; RV32I:       # %bb.0:
+; RV32I-NEXT:    sltiu a1, a0, 13
+; RV32I-NEXT:    addi a1, a1, -1
+; RV32I-NEXT:    andi a1, a1, -13
+; RV32I-NEXT:    add a0, a0, a1
+; RV32I-NEXT:    ret
+;
+; RV32ZBB-LABEL: sub_if_uge_C_nsw_i8:
+; RV32ZBB:       # %bb.0:
+; RV32ZBB-NEXT:    addi a1, a0, -13
+; RV32ZBB-NEXT:    zext.b a1, a1
+; RV32ZBB-NEXT:    minu a0, a0, a1
+; RV32ZBB-NEXT:    ret
+  %cmp = icmp ugt i8 %x, 12
+  %sub = add nsw i8 %x, -13
+  %conv4 = select i1 %cmp, i8 %sub, i8 %x
+  ret i8 %conv4
+}
diff --git a/llvm/test/CodeGen/RISCV/rv64zbb.ll b/llvm/test/CodeGen/RISCV/rv64zbb.ll
index 17eb0817d548a..1faafbe8b8187 100644
--- a/llvm/test/CodeGen/RISCV/rv64zbb.ll
+++ b/llvm/test/CodeGen/RISCV/rv64zbb.ll
@@ -1898,7 +1898,7 @@ define i8 @sub_if_uge_C_i8(i8 zeroext %x) {
 ; RV64ZBB:       # %bb.0:
 ; RV64ZBB-NEXT:    addi a1, a0, -13
 ; RV64ZBB-NEXT:    zext.b a1, a1
-; RV64ZBB-NEXT:    minu a0, a1, a0
+; RV64ZBB-NEXT:    minu a0, a0, a1
 ; RV64ZBB-NEXT:    ret
   %cmp = icmp ugt i8 %x, 12
   %sub = add i8 %x, -13
@@ -1919,7 +1919,7 @@ define i16 @sub_if_uge_C_i16(i16 zeroext %x) {
 ; RV64ZBB:       # %bb.0:
 ; RV64ZBB-NEXT:    addi a1, a0, -251
 ; RV64ZBB-NEXT:    zext.h a1, a1
-; RV64ZBB-NEXT:    minu a0, a1, a0
+; RV64ZBB-NEXT:    minu a0, a0, a1
 ; RV64ZBB-NEXT:    ret
   %cmp = icmp ugt i16 %x, 250
   %sub = add i16 %x, -251
@@ -1945,7 +1945,7 @@ define i32 @sub_if_uge_C_i32(i32 signext %x) {
 ; RV64ZBB-NEXT:    lui a1, 1048560
 ; RV64ZBB-NEXT:    addi a1, a1, 15
 ; RV64ZBB-NEXT:    addw a1, a0, a1
-; RV64ZBB-NEXT:    minu a0, a1, a0
+; RV64ZBB-NEXT:    minu a0, a0, a1
 ; RV64ZBB-NEXT:    ret
   %cmp = icmp ugt i32 %x, 65520
   %sub = add i32 %x, -65521
@@ -1975,7 +1975,7 @@ define i64 @sub_if_uge_C_i64(i64 %x) {
 ; RV64ZBB-NEXT:    addiw a1, a1, -761
 ; RV64ZBB-NEXT:    slli a1, a1, 9
 ; RV64ZBB-NEXT:    add a1, a0, a1
-; RV64ZBB-NEXT:    minu a0, a1, a0
+; RV64ZBB-NEXT:    minu a0, a0, a1
 ; RV64ZBB-NEXT:    ret
   %cmp = icmp ugt i64 %x, 4999999999
   %sub = add i64 %x, -5000000000
@@ -2005,7 +2005,7 @@ define i32 @sub_if_uge_C_multiuse_cmp_i32(i32 signext %x, ptr %z) {
 ; RV64ZBB-NEXT:    addi a3, a3, 15
 ; RV64ZBB-NEXT:    sltu a2, a2, a0
 ; RV64ZBB-NEXT:    addw a3, a0, a3
-; RV64ZBB-NEXT:    minu a0, a3, a0
+; RV64ZBB-NEXT:    minu a0, a0, a3
 ; RV64ZBB-NEXT:    sw a2, 0(a1)
 ; RV64ZBB-NEXT:    ret
   %cmp = icmp ugt i32 %x, 65520
@@ -2037,7 +2037,7 @@ define i32 @sub_if_uge_C_multiuse_sub_i32(i32 signext %x, ptr %z) {
 ; RV64ZBB-NEXT:    lui a2, 1048560
 ; RV64ZBB-NEXT:    addi a2, a2, 15
 ; RV64ZBB-NEXT:    addw a2, a0, a2
-; RV64ZBB-NEXT:    minu a0, a2, a0
+; RV64ZBB-NEXT:    minu a0, a0, a2
 ; RV64ZBB-NEXT:    sw a2, 0(a1)
 ; RV64ZBB-NEXT:    ret
   %sub = add i32 %x, -65521

pfusik · May 15, 2025

llvm/test/CodeGen/RISCV/rv32zbb.ll

+define noundef i8 @sub_if_uge_C_nsw_i8(i8 zeroext %x) {
+; RV32I-LABEL: sub_if_uge_C_nsw_i8:
+; RV32I:       # %bb.0:
+; RV32I-NEXT:    sltiu a1, a0, 13
+; RV32I-NEXT:    addi a1, a1, -1
+; RV32I-NEXT:    andi a1, a1, -13
+; RV32I-NEXT:    add a0, a0, a1
+; RV32I-NEXT:    ret
+;
+; RV32ZBB-LABEL: sub_if_uge_C_nsw_i8:
+; RV32ZBB:       # %bb.0:
+; RV32ZBB-NEXT:    addi a1, a0, -13
+; RV32ZBB-NEXT:    zext.b a1, a1
+; RV32ZBB-NEXT:    minu a0, a0, a1
+; RV32ZBB-NEXT:    ret
+  %cmp = icmp ugt i8 %x, 12
+  %sub = add nsw i8 %x, -13
+  %conv4 = select i1 %cmp, i8 %sub, i8 %x
+  ret i8 %conv4
+}


This doesn't test this fix. How to test?

I think this might do the trick (at least for the ult variant):

define i7 @src(i7 %a) { %x = or i7 %a, 51 %c = icmp ult i7 %x, -17 %add = add nsw i7 %x, 17 %s = select i1 %c, i7 %x, i7 %add ret i7 %s }

RKSimon · May 15, 2025

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

+           sd_match(N2, m_Add(m_Specific(N1), m_ConstInt(AddC))) && AddC == -C))
+        return DAG.getNode(ISD::UMIN, DL, VT, Cond0,
+                           DAG.getNode(ISD::ADD, DL, VT, Cond0,
+                                       DAG.getConstant(AddC, DL, VT)));


It might be cleaner just to split these and then do:

if (CC == ISD::SETULT && Cond0 == N1 && sd_match(N2, m_Add(m_Specific(N1), m_SpecificInt(-C)))) return DAG.getNode(ISD::UMIN, DL, VT, Cond0, DAG.getNode(ISD::ADD, DL, VT, Cond0, DAG.getConstant(-C, DL, VT)));

etc.

topperc · May 15, 2025

~~Isn't this only one possible problem? Don't we need a freeze?~~

Nevermind, I guess if x is poison, the select result was already poison so its only the add that needs to be fixed.

arsenm · May 16, 2025

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

-           sd_match(N2, m_Add(m_Specific(N1), m_SpecificInt(-C)))))
-        return DAG.getNode(ISD::UMIN, DL, VT, N1, N2);
+      if (CC == ISD::SETUGT && Cond0 == N2 &&
+          sd_match(N1, m_Add(m_Specific(N2), m_SpecificInt(~C))))


Braces, and/or use some temporary values to reduce this ugly wrapping

…" miscompile

…compile This fixes llvm#135194 incorrectly reusing the existing `add nuw/nsw` while the transformed code relies on an unsigned wrap.

bjope · May 16, 2025

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

@@ -12140,11 +12140,16 @@ SDValue DAGCombiner::visitSELECT(SDNode *N) {
    // (select (ult x, C), x, (add x, -C)) -> (umin x, (add x, -C))
    APInt C;
    if (sd_match(Cond1, m_ConstInt(C)) && hasUMin(VT)) {


nit: Could add a small comment here telling why we need to recreate the ADD. Just to avoid that someone tries to simplify this in the future, or if someone wonder why we can do this without introducing FREEZE.

Maybe something like this:
// Need to drop any poison generating flags from the ADD, to ensure that the result isn't more poisonous.

bjope

LGTM, thanks!

…mpile (llvm#140042) This fixes llvm#135194 incorrectly reusing the existing `add nuw/nsw` while the transformed code relies on an unsigned wrap.

llvmbot added the llvm:SelectionDAG SelectionDAGISel as well label May 15, 2025

pfusik mentioned this pull request May 15, 2025

[DAGCombiner] Fold subtraction if above a constant threshold to umin #135194

Merged

pfusik commented May 15, 2025

View reviewed changes

RKSimon reviewed May 15, 2025

View reviewed changes

RKSimon requested a review from bjope May 15, 2025 12:03

arsenm reviewed May 16, 2025

View reviewed changes

pfusik added 2 commits May 16, 2025 10:56

[RISCV][test] Add test for "subtraction if above a constant threshold…

fd9fa66

…" miscompile

[DAGCombiner] Fix the "subtraction if above a constant threshold" mis…

f052064

…compile This fixes llvm#135194 incorrectly reusing the existing `add nuw/nsw` while the transformed code relies on an unsigned wrap.

pfusik force-pushed the sub-minu-c-poison branch from 8d79331 to f052064 Compare May 16, 2025 09:03

pfusik changed the title ~~[DAGCombiner] Fix the "subtraction if above a constant threshold" transform~~ [DAGCombiner] Fix the "subtraction if above a constant threshold" miscompile May 16, 2025

[DAGCombiner] Prettify with braces and temporaries

74ca22c

bjope reviewed May 16, 2025

View reviewed changes

[DAGCombiner] Explain why we recreate ADD

b61f74e

bjope approved these changes May 16, 2025

View reviewed changes

pfusik merged commit 9e22f96 into llvm:main May 17, 2025
11 checks passed

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

[DAGCombiner] Fix the "subtraction if above a constant threshold" miscompile #140042

[DAGCombiner] Fix the "subtraction if above a constant threshold" miscompile #140042

Uh oh!

pfusik commented May 15, 2025 •

edited

Loading

Uh oh!

llvmbot commented May 15, 2025

Uh oh!

pfusik May 15, 2025

Uh oh!

bjope May 15, 2025

Uh oh!

RKSimon May 15, 2025

Uh oh!

pfusik May 15, 2025

Uh oh!

topperc commented May 15, 2025 •

edited

Loading

Uh oh!

arsenm May 16, 2025

Uh oh!

pfusik May 16, 2025

Uh oh!

bjope May 16, 2025

Uh oh!

pfusik May 16, 2025

Uh oh!

bjope left a comment

Uh oh!

Uh oh!

Uh oh!

Search code, repositories, users, issues, pull requests...

[DAGCombiner] Fix the "subtraction if above a constant threshold" miscompile #140042

[DAGCombiner] Fix the "subtraction if above a constant threshold" miscompile #140042

Uh oh!

Conversation

pfusik commented May 15, 2025 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Uh oh!

llvmbot commented May 15, 2025

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

topperc commented May 15, 2025 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

bjope left a comment

Choose a reason for hiding this comment

Uh oh!

Uh oh!

Uh oh!

pfusik commented May 15, 2025 •

edited

Loading

topperc commented May 15, 2025 •

edited

Loading