Skip to content

[GlobalIsel] Improve poison analysis #93731

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 1 commit into from
Jul 12, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
54 changes: 53 additions & 1 deletion llvm/lib/CodeGen/GlobalISel/Utils.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1785,7 +1785,6 @@ static bool canCreateUndefOrPoison(Register Reg, const MachineRegisterInfo &MRI,

// Check whether opcode is a poison/undef-generating operation.
switch (RegDef->getOpcode()) {
case TargetOpcode::G_FREEZE:
case TargetOpcode::G_BUILD_VECTOR:
case TargetOpcode::G_CONSTANT_FOLD_BARRIER:
return false;
Expand Down Expand Up @@ -1827,6 +1826,50 @@ static bool canCreateUndefOrPoison(Register Reg, const MachineRegisterInfo &MRI,
case TargetOpcode::G_USHLSAT:
return includesPoison(Kind) &&
!shiftAmountKnownInRange(RegDef->getOperand(2).getReg(), MRI);
case TargetOpcode::G_INSERT_VECTOR_ELT: {
GInsertVectorElement *Insert = cast<GInsertVectorElement>(RegDef);
if (includesPoison(Kind)) {
std::optional<ValueAndVReg> Index =
getIConstantVRegValWithLookThrough(Insert->getIndexReg(), MRI);
if (!Index)
return true;
LLT VecTy = MRI.getType(Insert->getVectorReg());
return Index->Value.uge(VecTy.getElementCount().getKnownMinValue());
}
return false;
}
case TargetOpcode::G_EXTRACT_VECTOR_ELT: {
GExtractVectorElement *Extract = cast<GExtractVectorElement>(RegDef);
if (includesPoison(Kind)) {
std::optional<ValueAndVReg> Index =
getIConstantVRegValWithLookThrough(Extract->getIndexReg(), MRI);
if (!Index)
return true;
LLT VecTy = MRI.getType(Extract->getVectorReg());
return Index->Value.uge(VecTy.getElementCount().getKnownMinValue());
}
return false;
}
case TargetOpcode::G_SHUFFLE_VECTOR: {
GShuffleVector *Shuffle = cast<GShuffleVector>(RegDef);
ArrayRef<int> Mask = Shuffle->getMask();
return includesPoison(Kind) && is_contained(Mask, -1);
}
case TargetOpcode::G_FNEG:
case TargetOpcode::G_PHI:
case TargetOpcode::G_SELECT:
case TargetOpcode::G_UREM:
case TargetOpcode::G_SREM:
case TargetOpcode::G_FREEZE:
case TargetOpcode::G_ICMP:
case TargetOpcode::G_FCMP:
case TargetOpcode::G_FADD:
case TargetOpcode::G_FSUB:
case TargetOpcode::G_FMUL:
case TargetOpcode::G_FDIV:
case TargetOpcode::G_FREM:
case TargetOpcode::G_PTR_ADD:
return false;
default:
return !isa<GCastOp>(RegDef) && !isa<GBinOp>(RegDef);
}
Expand Down Expand Up @@ -1858,6 +1901,15 @@ static bool isGuaranteedNotToBeUndefOrPoison(Register Reg,
return false;
return true;
}
case TargetOpcode::G_PHI: {
GPhi *Phi = cast<GPhi>(RegDef);
unsigned NumIncoming = Phi->getNumIncomingValues();
for (unsigned I = 0; I < NumIncoming; ++I)
if (!::isGuaranteedNotToBeUndefOrPoison(Phi->getIncomingValue(I), MRI,
Depth + 1, Kind))
return false;
return true;
}
default: {
auto MOCheck = [&](const MachineOperand &MO) {
if (!MO.isReg())
Expand Down
296 changes: 292 additions & 4 deletions llvm/test/CodeGen/AArch64/GlobalISel/combine-freeze.mir
Original file line number Diff line number Diff line change
Expand Up @@ -655,8 +655,7 @@ body: |
; CHECK-NEXT: %c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %cmp:_(s1) = G_ICMP intpred(eq), %c(s64), %d
; CHECK-NEXT: [[FREEZE:%[0-9]+]]:_(s1) = G_FREEZE %cmp
; CHECK-NEXT: %ext:_(s64) = G_ZEXT [[FREEZE]](s1)
; CHECK-NEXT: %ext:_(s64) = G_ZEXT %cmp(s1)
; CHECK-NEXT: $x0 = COPY %ext(s64)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
Expand All @@ -682,8 +681,7 @@ body: |
; CHECK-NEXT: %c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %cmp:_(s1) = G_FCMP floatpred(oeq), %c(s64), %d
; CHECK-NEXT: [[FREEZE:%[0-9]+]]:_(s1) = G_FREEZE %cmp
; CHECK-NEXT: %ext:_(s64) = G_ZEXT [[FREEZE]](s1)
; CHECK-NEXT: %ext:_(s64) = G_ZEXT %cmp(s1)
; CHECK-NEXT: $x0 = COPY %ext(s64)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
Expand Down Expand Up @@ -1152,3 +1150,293 @@ body: |
%2:_(s64) = G_FREEZE %1
$x0 = COPY %2(s64)
RET_ReallyLR implicit $x0
...
---
name: freeze_fneg_fold_barrier
body: |
bb.1:
liveins: $w0

; CHECK-LABEL: name: freeze_fneg_fold_barrier
; CHECK: liveins: $w0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %cst:_(s64) = G_FCONSTANT double 0.000000e+00
; CHECK-NEXT: %c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: [[FNEG:%[0-9]+]]:_(s64) = G_FNEG %c
; CHECK-NEXT: $x0 = COPY [[FNEG]](s64)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
%cst:_(s64) = G_FCONSTANT double 0.0
%c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%1:_(s64) = G_FNEG %c
%2:_(s64) = G_FREEZE %1
$x0 = COPY %2(s64)
RET_ReallyLR implicit $x0
...
---
name: freeze_frem_fold_barrier
body: |
bb.1:
liveins: $w0

; CHECK-LABEL: name: freeze_frem_fold_barrier
; CHECK: liveins: $w0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %cst:_(s64) = G_FCONSTANT double 0.000000e+00
; CHECK-NEXT: %c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: [[FREM:%[0-9]+]]:_(s64) = G_FREM %c, %d
; CHECK-NEXT: $x0 = COPY [[FREM]](s64)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
%cst:_(s64) = G_FCONSTANT double 0.0
%c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%1:_(s64) = G_FREM %c, %d
%2:_(s64) = G_FREEZE %1
$x0 = COPY %2(s64)
RET_ReallyLR implicit $x0
...
---
name: freeze_fdiv_fold_barrier
body: |
bb.1:
liveins: $w0

; CHECK-LABEL: name: freeze_fdiv_fold_barrier
; CHECK: liveins: $w0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %cst:_(s64) = G_FCONSTANT double 0.000000e+00
; CHECK-NEXT: %c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: [[FDIV:%[0-9]+]]:_(s64) = G_FDIV %c, %d
; CHECK-NEXT: $x0 = COPY [[FDIV]](s64)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
%cst:_(s64) = G_FCONSTANT double 0.0
%c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%1:_(s64) = G_FDIV %c, %d
%2:_(s64) = G_FREEZE %1
$x0 = COPY %2(s64)
RET_ReallyLR implicit $x0
...
---
name: freeze_fmul_fold_barrier
body: |
bb.1:
liveins: $w0

; CHECK-LABEL: name: freeze_fmul_fold_barrier
; CHECK: liveins: $w0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %cst:_(s64) = G_FCONSTANT double 0.000000e+00
; CHECK-NEXT: %c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: [[FMUL:%[0-9]+]]:_(s64) = G_FMUL %c, %d
; CHECK-NEXT: $x0 = COPY [[FMUL]](s64)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
%cst:_(s64) = G_FCONSTANT double 0.0
%c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%1:_(s64) = G_FMUL %c, %d
%2:_(s64) = G_FREEZE %1
$x0 = COPY %2(s64)
RET_ReallyLR implicit $x0
...
---
name: freeze_fsub_fold_barrier
body: |
bb.1:
liveins: $w0

; CHECK-LABEL: name: freeze_fsub_fold_barrier
; CHECK: liveins: $w0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %cst:_(s64) = G_FCONSTANT double 0.000000e+00
; CHECK-NEXT: %c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: [[FSUB:%[0-9]+]]:_(s64) = G_FSUB %c, %d
; CHECK-NEXT: $x0 = COPY [[FSUB]](s64)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
%cst:_(s64) = G_FCONSTANT double 0.0
%c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%1:_(s64) = G_FSUB %c, %d
%2:_(s64) = G_FREEZE %1
$x0 = COPY %2(s64)
RET_ReallyLR implicit $x0
...
---
name: freeze_fadd_fold_barrier
body: |
bb.1:
liveins: $w0

; CHECK-LABEL: name: freeze_fadd_fold_barrier
; CHECK: liveins: $w0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %cst:_(s64) = G_FCONSTANT double 0.000000e+00
; CHECK-NEXT: %c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: [[FADD:%[0-9]+]]:_(s64) = G_FADD %c, %d
; CHECK-NEXT: $x0 = COPY [[FADD]](s64)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
%cst:_(s64) = G_FCONSTANT double 0.0
%c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%1:_(s64) = G_FADD %c, %d
%2:_(s64) = G_FREEZE %1
$x0 = COPY %2(s64)
RET_ReallyLR implicit $x0
...
---
name: freeze_urem_fold_barrier
body: |
bb.1:
liveins: $w0

; CHECK-LABEL: name: freeze_urem_fold_barrier
; CHECK: liveins: $w0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %cst:_(s64) = G_CONSTANT i64 9
; CHECK-NEXT: %c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: [[UREM:%[0-9]+]]:_(s64) = G_UREM %c, %d
; CHECK-NEXT: $x0 = COPY [[UREM]](s64)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
%cst:_(s64) = G_CONSTANT i64 9
%c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%1:_(s64) = G_UREM %c, %d
%2:_(s64) = G_FREEZE %1
$x0 = COPY %2(s64)
RET_ReallyLR implicit $x0
...
---
name: freeze_srem_fold_barrier
body: |
bb.1:
liveins: $w0

; CHECK-LABEL: name: freeze_srem_fold_barrier
; CHECK: liveins: $w0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %cst:_(s64) = G_CONSTANT i64 9
; CHECK-NEXT: %c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: %d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
; CHECK-NEXT: [[SREM:%[0-9]+]]:_(s64) = G_SREM %c, %d
; CHECK-NEXT: $x0 = COPY [[SREM]](s64)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
%cst:_(s64) = G_CONSTANT i64 9
%c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%1:_(s64) = G_SREM %c, %d
%2:_(s64) = G_FREEZE %1
$x0 = COPY %2(s64)
RET_ReallyLR implicit $x0
...
---
name: freeze_ptradd_fold_barrier
body: |
bb.1:
liveins: $w0

; CHECK-LABEL: name: freeze_ptradd_fold_barrier
; CHECK: liveins: $w0
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %p:_(p0) = COPY $x0
; CHECK-NEXT: %cst:_(s64) = G_CONSTANT i64 9
; CHECK-NEXT: [[FREEZE:%[0-9]+]]:_(p0) = G_FREEZE %p
; CHECK-NEXT: [[PTR_ADD:%[0-9]+]]:_(p0) = G_PTR_ADD [[FREEZE]], %cst(s64)
; CHECK-NEXT: $x0 = COPY [[PTR_ADD]](p0)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%0:_(s64) = COPY $x0
%p:_(p0) = COPY $x0
%cst:_(s64) = G_CONSTANT i64 9
%c:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%d:_(s64) = G_CONSTANT_FOLD_BARRIER %cst
%1:_(p0) = G_PTR_ADD %p, %cst
%2:_(p0) = G_FREEZE %1
$x0 = COPY %2(p0)
RET_ReallyLR implicit $x0
...
---
# select (false, x, y) -> y
name: freeze_select_fold_barrier
body: |
bb.1:
liveins: $x0, $x1
; CHECK-LABEL: name: freeze_select_fold_barrier
; CHECK: liveins: $x0, $x1
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: [[COPY:%[0-9]+]]:_(s64) = COPY $x1
; CHECK-NEXT: [[FREEZE:%[0-9]+]]:_(s64) = G_FREEZE [[COPY]]
; CHECK-NEXT: $x0 = COPY [[FREEZE]](s64)
%0:_(s64) = COPY $x0
%1:_(s64) = COPY $x1
%2:_(s1) = G_CONSTANT i1 false
%3:_(s64) = G_SELECT %2, %0, %1
%4:_(s64) = G_FREEZE %3
$x0 = COPY %4(s64)
...
---
name: freeze_extract_and_shuffle_vector_fold_barrier
body: |
bb.1:
liveins: $x0, $x1
; CHECK-LABEL: name: freeze_extract_and_shuffle_vector_fold_barrier
; CHECK: liveins: $x0, $x1
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %arg1:_(<4 x s32>) = COPY $q0
; CHECK-NEXT: %arg2:_(<4 x s32>) = COPY $q1
; CHECK-NEXT: %idx:_(s64) = G_CONSTANT i64 0
; CHECK-NEXT: %sv:_(<4 x s32>) = G_SHUFFLE_VECTOR %arg1(<4 x s32>), %arg2, shufflemask(3, 0, 0, 0)
; CHECK-NEXT: %freeze_sv:_(<4 x s32>) = G_FREEZE %sv
; CHECK-NEXT: %extract:_(s32) = G_EXTRACT_VECTOR_ELT %freeze_sv(<4 x s32>), %idx(s64)
; CHECK-NEXT: $w0 = COPY %extract(s32)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%arg1:_(<4 x s32>) = COPY $q0
%arg2:_(<4 x s32>) = COPY $q1
%idx:_(s64) = G_CONSTANT i64 0
%sv:_(<4 x s32>) = G_SHUFFLE_VECTOR %arg1(<4 x s32>), %arg2(<4 x s32>), shufflemask(3, 0, 0, 0)
%freeze_sv:_(<4 x s32>) = G_FREEZE %sv
%extract:_(s32) = G_EXTRACT_VECTOR_ELT %freeze_sv(<4 x s32>), %idx(s64)
%freeze:_(s32) = G_FREEZE %extract
$w0 = COPY %extract(s32)
RET_ReallyLR implicit $x0
...
---
name: freeze_insert_and_shuffle_vector_fold_barrier
body: |
bb.1:
liveins: $x0, $x1
; CHECK-LABEL: name: freeze_insert_and_shuffle_vector_fold_barrier
; CHECK: liveins: $x0, $x1
; CHECK-NEXT: {{ $}}
; CHECK-NEXT: %elt:_(s32) = COPY $w0
; CHECK-NEXT: %arg1:_(<4 x s32>) = COPY $q0
; CHECK-NEXT: %arg2:_(<4 x s32>) = COPY $q1
; CHECK-NEXT: %idx:_(s64) = G_CONSTANT i64 0
; CHECK-NEXT: %sv:_(<4 x s32>) = G_SHUFFLE_VECTOR %arg1(<4 x s32>), %arg2, shufflemask(3, 0, 0, 0)
; CHECK-NEXT: %freeze_sv:_(<4 x s32>) = G_FREEZE %sv
; CHECK-NEXT: [[FREEZE:%[0-9]+]]:_(s32) = G_FREEZE %elt
; CHECK-NEXT: %extract:_(<4 x s32>) = G_INSERT_VECTOR_ELT %freeze_sv, [[FREEZE]](s32), %idx(s64)
; CHECK-NEXT: $q0 = COPY %extract(<4 x s32>)
; CHECK-NEXT: RET_ReallyLR implicit $x0
%elt:_(s32) = COPY $w0
%arg1:_(<4 x s32>) = COPY $q0
%arg2:_(<4 x s32>) = COPY $q1
%idx:_(s64) = G_CONSTANT i64 0
%sv:_(<4 x s32>) = G_SHUFFLE_VECTOR %arg1(<4 x s32>), %arg2(<4 x s32>), shufflemask(3, 0, 0, 0)
%freeze_sv:_(<4 x s32>) = G_FREEZE %sv
%extract:_(<4 x s32>) = G_INSERT_VECTOR_ELT %freeze_sv(<4 x s32>), %elt(s32), %idx(s64)
%freeze:_(<4 x s32>) = G_FREEZE %extract
$q0 = COPY %freeze(<4 x s32>)
RET_ReallyLR implicit $x0
Loading