[llvm-branch-commits] [llvm] release/20.x: [RISCV] Fix assertion failure when using -fstack-clash-protection (#135248) (PR #139388)
topperc wrote: @tstellar This is the fix. Can I push to this PR or do I need to make a new PR from my fork? ``` diff --git a/llvm/test/CodeGen/RISCV/pr135206.ll b/llvm/test/CodeGen/RISCV/pr135206.ll index 196e78d8ed8b..859179f62d70 100644 --- a/llvm/test/CodeGen/RISCV/pr135206.ll +++ b/llvm/test/CodeGen/RISCV/pr135206.ll @@ -44,7 +44,7 @@ define i1 @foo() nounwind "probe-stack"="inline-asm" "target-features"="+v" { ; CHECK-NEXT:lui a0, 8 ; CHECK-NEXT:addiw a0, a0, 32 ; CHECK-NEXT:add a0, sp, a0 -; CHECK-NEXT:vs1r.v v8, (a0) # vscale x 8-byte Folded Spill +; CHECK-NEXT:vs1r.v v8, (a0) # Unknown-size Folded Spill ; CHECK-NEXT:addiw a0, a1, 1622 ; CHECK-NEXT:vse8.v v8, (s0) ; CHECK-NEXT:vse8.v v8, (s1) @@ -56,7 +56,7 @@ define i1 @foo() nounwind "probe-stack"="inline-asm" "target-features"="+v" { ; CHECK-NEXT:lui a0, 8 ; CHECK-NEXT:addiw a0, a0, 32 ; CHECK-NEXT:add a0, sp, a0 -; CHECK-NEXT:vl1r.v v8, (a0) # vscale x 8-byte Folded Reload +; CHECK-NEXT:vl1r.v v8, (a0) # Unknown-size Folded Reload ; CHECK-NEXT:vsetivli zero, 16, e8, m1, ta, ma ; CHECK-NEXT:vse8.v v8, (s0) ; CHECK-NEXT:vse8.v v8, (s1) ``` https://github.com/llvm/llvm-project/pull/139388 ___ llvm-branch-commits mailing list llvm-branch-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/llvm-branch-commits
[llvm-branch-commits] [llvm] release/20.x: [RISCV] Fix assertion failure when using -fstack-clash-protection (#135248) (PR #139388)
tstellar wrote: It looks like there are some test failures with this backport. https://github.com/llvm/llvm-project/pull/139388 ___ llvm-branch-commits mailing list llvm-branch-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/llvm-branch-commits
[llvm-branch-commits] [llvm] release/20.x: [RISCV] Fix assertion failure when using -fstack-clash-protection (#135248) (PR #139388)
https://github.com/llvmbot milestoned https://github.com/llvm/llvm-project/pull/139388 ___ llvm-branch-commits mailing list llvm-branch-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/llvm-branch-commits
[llvm-branch-commits] [llvm] release/20.x: [RISCV] Fix assertion failure when using -fstack-clash-protection (#135248) (PR #139388)
eyestoreoye wrote: Very clean code with good test coverage. This is a great example of best practices. https://github.com/llvm/llvm-project/pull/139388 ___ llvm-branch-commits mailing list llvm-branch-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/llvm-branch-commits
[llvm-branch-commits] [llvm] release/20.x: [RISCV] Fix assertion failure when using -fstack-clash-protection (#135248) (PR #139388)
llvmbot wrote: @preames What do you think about merging this PR to the release branch? https://github.com/llvm/llvm-project/pull/139388 ___ llvm-branch-commits mailing list llvm-branch-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/llvm-branch-commits
[llvm-branch-commits] [llvm] release/20.x: [RISCV] Fix assertion failure when using -fstack-clash-protection (#135248) (PR #139388)
llvmbot wrote: @llvm/pr-subscribers-backend-risc-v Author: None (llvmbot) Changes Backport b3d2dc321c5c78b7204696afe07fe6ef3375acfd Requested by: @tstellar --- Full diff: https://github.com/llvm/llvm-project/pull/139388.diff 2 Files Affected: - (modified) llvm/lib/Target/RISCV/RISCVFrameLowering.cpp (+5-3) - (added) llvm/test/CodeGen/RISCV/pr135206.ll (+84) ``diff diff --git a/llvm/lib/Target/RISCV/RISCVFrameLowering.cpp b/llvm/lib/Target/RISCV/RISCVFrameLowering.cpp index bb2e5781c34db..6f4c1e16190f4 100644 --- a/llvm/lib/Target/RISCV/RISCVFrameLowering.cpp +++ b/llvm/lib/Target/RISCV/RISCVFrameLowering.cpp @@ -2135,11 +2135,13 @@ TargetStackID::Value RISCVFrameLowering::getStackIDForScalableVectors() const { } // Synthesize the probe loop. -static void emitStackProbeInline(MachineFunction &MF, MachineBasicBlock &MBB, - MachineBasicBlock::iterator MBBI, DebugLoc DL, +static void emitStackProbeInline(MachineBasicBlock::iterator MBBI, DebugLoc DL, Register TargetReg, bool IsRVV) { assert(TargetReg != RISCV::X2 && "New top of stack cannot already be in SP"); + MachineBasicBlock &MBB = *MBBI->getParent(); + MachineFunction &MF = *MBB.getParent(); + auto &Subtarget = MF.getSubtarget(); const RISCVInstrInfo *TII = Subtarget.getInstrInfo(); bool IsRV64 = Subtarget.is64Bit(); @@ -2228,7 +2230,7 @@ void RISCVFrameLowering::inlineStackProbe(MachineFunction &MF, MachineBasicBlock::iterator MBBI = MI->getIterator(); DebugLoc DL = MBB.findDebugLoc(MBBI); Register TargetReg = MI->getOperand(1).getReg(); - emitStackProbeInline(MF, MBB, MBBI, DL, TargetReg, + emitStackProbeInline(MBBI, DL, TargetReg, (MI->getOpcode() == RISCV::PROBED_STACKALLOC_RVV)); MBBI->eraseFromParent(); } diff --git a/llvm/test/CodeGen/RISCV/pr135206.ll b/llvm/test/CodeGen/RISCV/pr135206.ll new file mode 100644 index 0..196e78d8ed8b9 --- /dev/null +++ b/llvm/test/CodeGen/RISCV/pr135206.ll @@ -0,0 +1,84 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 +; RUN: llc -mtriple riscv64 < %s -o - | FileCheck %s + +%"buff" = type { [4096 x i64] } + +declare void @llvm.memset.p0.i64(ptr, i8, i64, i1) +declare void @bar() + +define i1 @foo() nounwind "probe-stack"="inline-asm" "target-features"="+v" { +; CHECK-LABEL: foo: +; CHECK: # %bb.0: +; CHECK-NEXT:addi sp, sp, -2032 +; CHECK-NEXT:sd ra, 2024(sp) # 8-byte Folded Spill +; CHECK-NEXT:sd s0, 2016(sp) # 8-byte Folded Spill +; CHECK-NEXT:sd s1, 2008(sp) # 8-byte Folded Spill +; CHECK-NEXT:sd s2, 2000(sp) # 8-byte Folded Spill +; CHECK-NEXT:sd s3, 1992(sp) # 8-byte Folded Spill +; CHECK-NEXT:lui a0, 7 +; CHECK-NEXT:sub t1, sp, a0 +; CHECK-NEXT:lui t2, 1 +; CHECK-NEXT: .LBB0_1: # =>This Inner Loop Header: Depth=1 +; CHECK-NEXT:sub sp, sp, t2 +; CHECK-NEXT:sd zero, 0(sp) +; CHECK-NEXT:bne sp, t1, .LBB0_1 +; CHECK-NEXT: # %bb.2: +; CHECK-NEXT:addi sp, sp, -2048 +; CHECK-NEXT:addi sp, sp, -96 +; CHECK-NEXT:csrr t1, vlenb +; CHECK-NEXT:lui t2, 1 +; CHECK-NEXT: .LBB0_3: # =>This Inner Loop Header: Depth=1 +; CHECK-NEXT:sub sp, sp, t2 +; CHECK-NEXT:sd zero, 0(sp) +; CHECK-NEXT:sub t1, t1, t2 +; CHECK-NEXT:bge t1, t2, .LBB0_3 +; CHECK-NEXT: # %bb.4: +; CHECK-NEXT:sub sp, sp, t1 +; CHECK-NEXT:li a0, 86 +; CHECK-NEXT:addi s0, sp, 48 +; CHECK-NEXT:addi s1, sp, 32 +; CHECK-NEXT:addi s2, sp, 16 +; CHECK-NEXT:lui a1, 353637 +; CHECK-NEXT:vsetivli zero, 16, e8, m1, ta, ma +; CHECK-NEXT:vmv.v.x v8, a0 +; CHECK-NEXT:lui a0, 8 +; CHECK-NEXT:addiw a0, a0, 32 +; CHECK-NEXT:add a0, sp, a0 +; CHECK-NEXT:vs1r.v v8, (a0) # vscale x 8-byte Folded Spill +; CHECK-NEXT:addiw a0, a1, 1622 +; CHECK-NEXT:vse8.v v8, (s0) +; CHECK-NEXT:vse8.v v8, (s1) +; CHECK-NEXT:vse8.v v8, (s2) +; CHECK-NEXT:slli a1, a0, 32 +; CHECK-NEXT:add s3, a0, a1 +; CHECK-NEXT:sd s3, 64(sp) +; CHECK-NEXT:call bar +; CHECK-NEXT:lui a0, 8 +; CHECK-NEXT:addiw a0, a0, 32 +; CHECK-NEXT:add a0, sp, a0 +; CHECK-NEXT:vl1r.v v8, (a0) # vscale x 8-byte Folded Reload +; CHECK-NEXT:vsetivli zero, 16, e8, m1, ta, ma +; CHECK-NEXT:vse8.v v8, (s0) +; CHECK-NEXT:vse8.v v8, (s1) +; CHECK-NEXT:vse8.v v8, (s2) +; CHECK-NEXT:sd s3, 64(sp) +; CHECK-NEXT:li a0, 0 +; CHECK-NEXT:csrr a1, vlenb +; CHECK-NEXT:add sp, sp, a1 +; CHECK-NEXT:lui a1, 8 +; CHECK-NEXT:addiw a1, a1, -1952 +; CHECK-NEXT:add sp, sp, a1 +; CHECK-NEXT:ld ra, 2024(sp) # 8-byte Folded Reload +; CHECK-NEXT:ld s0, 2016(sp) # 8-byte Folded Reload +; CHECK-NEXT:ld s1, 2008(sp) # 8-byte Folded Reload +; CHECK-NEXT:ld s2, 2000(sp) # 8-byte Folded Reload +; CHECK-NEXT:ld s3, 1992(sp) # 8-byte Folded Reload +; CHECK-NEXT:addi sp,
[llvm-branch-commits] [llvm] release/20.x: [RISCV] Fix assertion failure when using -fstack-clash-protection (#135248) (PR #139388)
https://github.com/llvmbot created https://github.com/llvm/llvm-project/pull/139388 Backport b3d2dc321c5c78b7204696afe07fe6ef3375acfd Requested by: @tstellar >From ff4132ec328ed80be247856939dbf7345106cc55 Mon Sep 17 00:00:00 2001 From: Paul Kirth Date: Fri, 18 Apr 2025 09:12:52 -0700 Subject: [PATCH] [RISCV] Fix assertion failure when using -fstack-clash-protection (#135248) We can't assume MBBI is still pointing at MBB if we've already expanded a probe. We need to re-query the MBB from MBBI. Fixes #135206 Co-authored-by: Craig Topper (cherry picked from commit b3d2dc321c5c78b7204696afe07fe6ef3375acfd) --- llvm/lib/Target/RISCV/RISCVFrameLowering.cpp | 8 +- llvm/test/CodeGen/RISCV/pr135206.ll | 84 2 files changed, 89 insertions(+), 3 deletions(-) create mode 100644 llvm/test/CodeGen/RISCV/pr135206.ll diff --git a/llvm/lib/Target/RISCV/RISCVFrameLowering.cpp b/llvm/lib/Target/RISCV/RISCVFrameLowering.cpp index bb2e5781c34db..6f4c1e16190f4 100644 --- a/llvm/lib/Target/RISCV/RISCVFrameLowering.cpp +++ b/llvm/lib/Target/RISCV/RISCVFrameLowering.cpp @@ -2135,11 +2135,13 @@ TargetStackID::Value RISCVFrameLowering::getStackIDForScalableVectors() const { } // Synthesize the probe loop. -static void emitStackProbeInline(MachineFunction &MF, MachineBasicBlock &MBB, - MachineBasicBlock::iterator MBBI, DebugLoc DL, +static void emitStackProbeInline(MachineBasicBlock::iterator MBBI, DebugLoc DL, Register TargetReg, bool IsRVV) { assert(TargetReg != RISCV::X2 && "New top of stack cannot already be in SP"); + MachineBasicBlock &MBB = *MBBI->getParent(); + MachineFunction &MF = *MBB.getParent(); + auto &Subtarget = MF.getSubtarget(); const RISCVInstrInfo *TII = Subtarget.getInstrInfo(); bool IsRV64 = Subtarget.is64Bit(); @@ -2228,7 +2230,7 @@ void RISCVFrameLowering::inlineStackProbe(MachineFunction &MF, MachineBasicBlock::iterator MBBI = MI->getIterator(); DebugLoc DL = MBB.findDebugLoc(MBBI); Register TargetReg = MI->getOperand(1).getReg(); - emitStackProbeInline(MF, MBB, MBBI, DL, TargetReg, + emitStackProbeInline(MBBI, DL, TargetReg, (MI->getOpcode() == RISCV::PROBED_STACKALLOC_RVV)); MBBI->eraseFromParent(); } diff --git a/llvm/test/CodeGen/RISCV/pr135206.ll b/llvm/test/CodeGen/RISCV/pr135206.ll new file mode 100644 index 0..196e78d8ed8b9 --- /dev/null +++ b/llvm/test/CodeGen/RISCV/pr135206.ll @@ -0,0 +1,84 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 +; RUN: llc -mtriple riscv64 < %s -o - | FileCheck %s + +%"buff" = type { [4096 x i64] } + +declare void @llvm.memset.p0.i64(ptr, i8, i64, i1) +declare void @bar() + +define i1 @foo() nounwind "probe-stack"="inline-asm" "target-features"="+v" { +; CHECK-LABEL: foo: +; CHECK: # %bb.0: +; CHECK-NEXT:addi sp, sp, -2032 +; CHECK-NEXT:sd ra, 2024(sp) # 8-byte Folded Spill +; CHECK-NEXT:sd s0, 2016(sp) # 8-byte Folded Spill +; CHECK-NEXT:sd s1, 2008(sp) # 8-byte Folded Spill +; CHECK-NEXT:sd s2, 2000(sp) # 8-byte Folded Spill +; CHECK-NEXT:sd s3, 1992(sp) # 8-byte Folded Spill +; CHECK-NEXT:lui a0, 7 +; CHECK-NEXT:sub t1, sp, a0 +; CHECK-NEXT:lui t2, 1 +; CHECK-NEXT: .LBB0_1: # =>This Inner Loop Header: Depth=1 +; CHECK-NEXT:sub sp, sp, t2 +; CHECK-NEXT:sd zero, 0(sp) +; CHECK-NEXT:bne sp, t1, .LBB0_1 +; CHECK-NEXT: # %bb.2: +; CHECK-NEXT:addi sp, sp, -2048 +; CHECK-NEXT:addi sp, sp, -96 +; CHECK-NEXT:csrr t1, vlenb +; CHECK-NEXT:lui t2, 1 +; CHECK-NEXT: .LBB0_3: # =>This Inner Loop Header: Depth=1 +; CHECK-NEXT:sub sp, sp, t2 +; CHECK-NEXT:sd zero, 0(sp) +; CHECK-NEXT:sub t1, t1, t2 +; CHECK-NEXT:bge t1, t2, .LBB0_3 +; CHECK-NEXT: # %bb.4: +; CHECK-NEXT:sub sp, sp, t1 +; CHECK-NEXT:li a0, 86 +; CHECK-NEXT:addi s0, sp, 48 +; CHECK-NEXT:addi s1, sp, 32 +; CHECK-NEXT:addi s2, sp, 16 +; CHECK-NEXT:lui a1, 353637 +; CHECK-NEXT:vsetivli zero, 16, e8, m1, ta, ma +; CHECK-NEXT:vmv.v.x v8, a0 +; CHECK-NEXT:lui a0, 8 +; CHECK-NEXT:addiw a0, a0, 32 +; CHECK-NEXT:add a0, sp, a0 +; CHECK-NEXT:vs1r.v v8, (a0) # vscale x 8-byte Folded Spill +; CHECK-NEXT:addiw a0, a1, 1622 +; CHECK-NEXT:vse8.v v8, (s0) +; CHECK-NEXT:vse8.v v8, (s1) +; CHECK-NEXT:vse8.v v8, (s2) +; CHECK-NEXT:slli a1, a0, 32 +; CHECK-NEXT:add s3, a0, a1 +; CHECK-NEXT:sd s3, 64(sp) +; CHECK-NEXT:call bar +; CHECK-NEXT:lui a0, 8 +; CHECK-NEXT:addiw a0, a0, 32 +; CHECK-NEXT:add a0, sp, a0 +; CHECK-NEXT:vl1r.v v8, (a0) # vscale x 8-byte Folded Reload +; CHECK-NEXT:vsetivli zero, 16, e8, m1, ta, ma +; CHECK-NEXT:vse8.v v8, (s0) +; CHECK-NEXT:vse8.v v8, (s1) +; CHECK-NEXT:vse8.v v8, (s2) +; CHECK-NEXT:sd s3, 64(sp) +; CHECK-NEXT:li a0, 0 +; CHECK-NEX