Skip to content

Commit 29c98e5

Browse files
committed
Revert "[Inline][Cloning] Defer simplification after phi-nodes resolution" #87963
Reopens #87534. Breaks multiple bots: https://lab.llvm.org/buildbot/#/builders/168/builds/20028 https://lab.llvm.org/buildbot/#/builders/74/builds/27773 And reproducer in a61f9fe. This reverts commit a61f9fe.
1 parent 69bde04 commit 29c98e5

File tree

4 files changed

+61
-39
lines changed

4 files changed

+61
-39
lines changed

llvm/lib/Transforms/Utils/CloneFunction.cpp

Lines changed: 57 additions & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,6 @@
1414

1515
#include "llvm/ADT/SetVector.h"
1616
#include "llvm/ADT/SmallVector.h"
17-
#include "llvm/Analysis/ConstantFolding.h"
1817
#include "llvm/Analysis/DomTreeUpdater.h"
1918
#include "llvm/Analysis/InstructionSimplify.h"
2019
#include "llvm/Analysis/LoopInfo.h"
@@ -541,13 +540,18 @@ void PruningFunctionCloner::CloneBlock(
541540
RemapInstruction(NewInst, VMap,
542541
ModuleLevelChanges ? RF_None : RF_NoModuleLevelChanges);
543542

544-
// Eagerly constant fold the newly cloned instruction. If successful, add
545-
// a mapping to the new value. Non-constant operands may be incomplete at
546-
// this stage, thus instruction simplification is performed after
547-
// processing phi-nodes.
548-
if (Value *V = ConstantFoldInstruction(
549-
NewInst, BB->getModule()->getDataLayout())) {
550-
if (isInstructionTriviallyDead(NewInst)) {
543+
// If we can simplify this instruction to some other value, simply add
544+
// a mapping to that value rather than inserting a new instruction into
545+
// the basic block.
546+
if (Value *V =
547+
simplifyInstruction(NewInst, BB->getModule()->getDataLayout())) {
548+
// On the off-chance that this simplifies to an instruction in the old
549+
// function, map it back into the new function.
550+
if (NewFunc != OldFunc)
551+
if (Value *MappedV = VMap.lookup(V))
552+
V = MappedV;
553+
554+
if (!NewInst->mayHaveSideEffects()) {
551555
VMap[&*II] = V;
552556
NewInst->eraseFromParent();
553557
continue;
@@ -819,34 +823,52 @@ void llvm::CloneAndPruneIntoFromInst(Function *NewFunc, const Function *OldFunc,
819823
}
820824
}
821825

822-
// As phi-nodes have been now remapped, allow incremental simplification of
823-
// newly-cloned instructions.
826+
// Make a second pass over the PHINodes now that all of them have been
827+
// remapped into the new function, simplifying the PHINode and performing any
828+
// recursive simplifications exposed. This will transparently update the
829+
// WeakTrackingVH in the VMap. Notably, we rely on that so that if we coalesce
830+
// two PHINodes, the iteration over the old PHIs remains valid, and the
831+
// mapping will just map us to the new node (which may not even be a PHI
832+
// node).
824833
const DataLayout &DL = NewFunc->getParent()->getDataLayout();
825-
for (const auto &BB : *OldFunc) {
826-
for (const auto &I : BB) {
827-
auto *NewI = dyn_cast_or_null<Instruction>(VMap.lookup(&I));
828-
if (!NewI)
829-
continue;
830-
831-
// Skip over non-intrinsic callsites, we don't want to remove any nodes
832-
// from the CGSCC.
833-
CallBase *CB = dyn_cast<CallBase>(NewI);
834-
if (CB && CB->getCalledFunction() &&
835-
!CB->getCalledFunction()->isIntrinsic())
836-
continue;
837-
838-
if (Value *V = simplifyInstruction(NewI, DL)) {
839-
NewI->replaceAllUsesWith(V);
840-
841-
if (isInstructionTriviallyDead(NewI)) {
842-
NewI->eraseFromParent();
843-
} else {
844-
// Did not erase it? Restore the new instruction into VMap previously
845-
// dropped by `ValueIsRAUWd`.
846-
VMap[&I] = NewI;
847-
}
848-
}
849-
}
834+
SmallSetVector<const Value *, 8> Worklist;
835+
for (unsigned Idx = 0, Size = PHIToResolve.size(); Idx != Size; ++Idx)
836+
if (isa<PHINode>(VMap[PHIToResolve[Idx]]))
837+
Worklist.insert(PHIToResolve[Idx]);
838+
839+
// Note that we must test the size on each iteration, the worklist can grow.
840+
for (unsigned Idx = 0; Idx != Worklist.size(); ++Idx) {
841+
const Value *OrigV = Worklist[Idx];
842+
auto *I = dyn_cast_or_null<Instruction>(VMap.lookup(OrigV));
843+
if (!I)
844+
continue;
845+
846+
// Skip over non-intrinsic callsites, we don't want to remove any nodes from
847+
// the CGSCC.
848+
CallBase *CB = dyn_cast<CallBase>(I);
849+
if (CB && CB->getCalledFunction() &&
850+
!CB->getCalledFunction()->isIntrinsic())
851+
continue;
852+
853+
// See if this instruction simplifies.
854+
Value *SimpleV = simplifyInstruction(I, DL);
855+
if (!SimpleV)
856+
continue;
857+
858+
// Stash away all the uses of the old instruction so we can check them for
859+
// recursive simplifications after a RAUW. This is cheaper than checking all
860+
// uses of To on the recursive step in most cases.
861+
for (const User *U : OrigV->users())
862+
Worklist.insert(cast<Instruction>(U));
863+
864+
// Replace the instruction with its simplified value.
865+
I->replaceAllUsesWith(SimpleV);
866+
867+
// If the original instruction had no side effects, remove it.
868+
if (isInstructionTriviallyDead(I))
869+
I->eraseFromParent();
870+
else
871+
VMap[OrigV] = I;
850872
}
851873

852874
// Remap debug intrinsic operands now that all values have been mapped.

llvm/test/Transforms/Inline/inline-deferred-instsimplify.ll

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -38,6 +38,8 @@ store_ptr_in_gvar: ; preds = %entry
3838

3939
check_pointers_are_equal: ; preds = %store_ptr_in_gvar, %entry
4040
%phi = phi ptr [ %ptr, %store_ptr_in_gvar ], [ @other_g_var, %entry ]
41+
; FIXME: While inlining, the following is miscompiled to i1 false,
42+
; as %ptr in the phi-node is not taken into account.
4143
%.not1 = icmp eq ptr %phi, %ptr
4244
br i1 %.not1, label %return, label %abort
4345

@@ -62,13 +64,9 @@ define i32 @main() {
6264
; CHECK-NEXT: br label [[CHECK_POINTERS_ARE_EQUAL_I]]
6365
; CHECK: check_pointers_are_equal.i:
6466
; CHECK-NEXT: [[PHI_I:%.*]] = phi ptr [ [[G_VAR]], [[STORE_PTR_IN_GVAR_I]] ], [ @other_g_var, [[TMP0:%.*]] ]
65-
; CHECK-NEXT: [[DOTNOT1_I:%.*]] = icmp eq ptr [[PHI_I]], [[G_VAR]]
66-
; CHECK-NEXT: br i1 [[DOTNOT1_I]], label [[CALLEE_EXIT:%.*]], label [[ABORT_I:%.*]]
67-
; CHECK: abort.i:
6867
; CHECK-NEXT: call void @abort()
6968
; CHECK-NEXT: unreachable
7069
; CHECK: callee.exit:
71-
; CHECK-NEXT: call void @llvm.lifetime.end.p0(i64 20, ptr [[G_VAR]])
7270
; CHECK-NEXT: ret i32 0
7371
;
7472
call void @callee(ptr noundef byval(%struct.a) align 8 @g_var)

llvm/test/Transforms/Inline/prof-update-sample-alwaysinline.ll

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -53,6 +53,7 @@ define void @caller() {
5353
!18 = !{!"VP", i32 0, i64 140, i64 111, i64 80, i64 222, i64 40, i64 333, i64 20}
5454
attributes #0 = { alwaysinline }
5555
; CHECK: ![[ENTRY_COUNT]] = !{!"function_entry_count", i64 600}
56+
; CHECK: ![[COUNT_CALLEE1]] = !{!"branch_weights", i32 2000}
5657
; CHECK: ![[COUNT_CALLEE]] = !{!"branch_weights", i32 1200}
5758
; CHECK: ![[COUNT_IND_CALLEE]] = !{!"VP", i32 0, i64 84, i64 111, i64 48, i64 222, i64 24, i64 333, i64 12}
5859
; CHECK: ![[COUNT_CALLER]] = !{!"branch_weights", i32 800}

llvm/test/Transforms/Inline/prof-update-sample.ll

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -52,6 +52,7 @@ define void @caller() {
5252
!17 = !{!"branch_weights", i32 400}
5353
!18 = !{!"VP", i32 0, i64 140, i64 111, i64 80, i64 222, i64 40, i64 333, i64 20}
5454
; CHECK: ![[ENTRY_COUNT]] = !{!"function_entry_count", i64 600}
55+
; CHECK: ![[COUNT_CALLEE1]] = !{!"branch_weights", i32 2000}
5556
; CHECK: ![[COUNT_CALLEE]] = !{!"branch_weights", i32 1200}
5657
; CHECK: ![[COUNT_IND_CALLEE]] = !{!"VP", i32 0, i64 84, i64 111, i64 48, i64 222, i64 24, i64 333, i64 12}
5758
; CHECK: ![[COUNT_CALLER]] = !{!"branch_weights", i32 800}

0 commit comments

Comments
 (0)