Skip to content
Merged
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
27 changes: 20 additions & 7 deletions llvm/lib/Target/AMDGPU/GCNHazardRecognizer.cpp
Original file line number | Diff line number | Diff line change
Expand Up @@ -1143,6 +1143,7 @@ bool GCNHazardRecognizer::fixVcmpxPermlaneHazards(MachineInstr *MI) {
bool GCNHazardRecognizer::fixVMEMtoScalarWriteHazards(MachineInstr *MI) {
if (!ST.hasVMEMtoScalarWriteHazard())
return false;
assert(!ST.hasExtendedWaitCounts());

if (!SIInstrInfo::isSALU(*MI) && !SIInstrInfo::isSMRD(*MI))
return false;
Expand Down Expand Up @@ -1189,6 +1190,7 @@ bool GCNHazardRecognizer::fixVMEMtoScalarWriteHazards(MachineInstr *MI) {
bool GCNHazardRecognizer::fixSMEMtoVectorWriteHazards(MachineInstr *MI) {
if (!ST.hasSMEMtoVectorWriteHazard())
return false;
assert(!ST.hasExtendedWaitCounts());

if (!SIInstrInfo::isVALU(*MI))
return false;
Expand Down Expand Up @@ -1273,7 +1275,11 @@ bool GCNHazardRecognizer::fixSMEMtoVectorWriteHazards(MachineInstr *MI) {
}

bool GCNHazardRecognizer::fixVcmpxExecWARHazard(MachineInstr *MI) {
if (!ST.hasVcmpxExecWARHazard() || !SIInstrInfo::isVALU(*MI))
if (!ST.hasVcmpxExecWARHazard())
return false;
assert(!ST.hasExtendedWaitCounts());

if (!SIInstrInfo::isVALU(*MI))
return false;

const SIRegisterInfo *TRI = ST.getRegisterInfo();
Expand Down Expand Up @@ -1343,6 +1349,7 @@ bool GCNHazardRecognizer::fixLdsBranchVmemWARHazard(MachineInstr *MI) {
return false;

assert(ST.hasLdsBranchVmemWARHazard());
assert(!ST.hasExtendedWaitCounts());

auto IsHazardInst = [](const MachineInstr &MI) {
if (SIInstrInfo::isDS(MI))
Expand Down Expand Up @@ -1452,6 +1459,8 @@ bool GCNHazardRecognizer::fixLdsDirectVMEMHazard(MachineInstr *MI) {
return I.readsRegister(VDSTReg, &TRI) || I.modifiesRegister(VDSTReg, &TRI);
};
bool LdsdirCanWait = ST.hasLdsWaitVMSRC();
// TODO: On GFX12 the hazard should expire on S_WAIT_LOADCNT/SAMPLECNT/BVHCNT
// according to the type of VMEM instruction.
auto IsExpiredFn = [this, LdsdirCanWait](const MachineInstr &I, int) {
return SIInstrInfo::isVALU(I) || SIInstrInfo::isEXP(I) ||
(I.getOpcode() == AMDGPU::S_WAITCNT && !I.getOperand(0).getImm()) ||
Expand All @@ -1477,11 +1486,11 @@ bool GCNHazardRecognizer::fixLdsDirectVMEMHazard(MachineInstr *MI) {
}

bool GCNHazardRecognizer::fixVALUPartialForwardingHazard(MachineInstr *MI) {
if (!ST.isWave64())
return false;
if (!ST.hasVALUPartialForwardingHazard())
return false;
if (!SIInstrInfo::isVALU(*MI))
assert(!ST.hasExtendedWaitCounts());

if (!ST.isWave64() || !SIInstrInfo::isVALU(*MI))
return false;

SmallSetVector<Register, 4> SrcVGPRs;
Expand Down Expand Up @@ -1628,6 +1637,8 @@ bool GCNHazardRecognizer::fixVALUPartialForwardingHazard(MachineInstr *MI) {
bool GCNHazardRecognizer::fixVALUTransUseHazard(MachineInstr *MI) {
if (!ST.hasVALUTransUseHazard())
return false;
assert(!ST.hasExtendedWaitCounts());

if (!SIInstrInfo::isVALU(*MI))
return false;

Expand Down Expand Up @@ -1767,6 +1778,7 @@ bool GCNHazardRecognizer::fixWMMAHazards(MachineInstr *MI) {
bool GCNHazardRecognizer::fixShift64HighRegBug(MachineInstr *MI) {
if (!ST.hasShift64HighRegBug())
return false;
assert(!ST.hasExtendedWaitCounts());

switch (MI->getOpcode()) {
default:
Expand Down Expand Up @@ -1896,6 +1908,7 @@ int GCNHazardRecognizer::checkFPAtomicToDenormModeHazard(MachineInstr *MI) {

if (!ST.hasFPAtomicToDenormModeHazard())
return 0;
assert(!ST.hasExtendedWaitCounts());

if (MI->getOpcode() != AMDGPU::S_DENORM_MODE)
return 0;
Expand Down Expand Up @@ -2721,11 +2734,11 @@ bool GCNHazardRecognizer::ShouldPreferAnother(SUnit *SU) {
}

bool GCNHazardRecognizer::fixVALUMaskWriteHazard(MachineInstr *MI) {
if (!ST.isWave64())
return false;
if (!ST.hasVALUMaskWriteHazard())
return false;
if (!SIInstrInfo::isSALU(*MI))
assert(!ST.hasExtendedWaitCounts());

if (!ST.isWave64() || !SIInstrInfo::isSALU(*MI))
return false;

// The hazard sequence is three instructions:
Expand Down