Skip to content

Commit 45f1295

Browse files
bcheng0127 authored and igcbot committed
Enable GRF read delay of send stall instructions
Enable the vISA option -schedWithSendSrcReadCycle
1 parent bc3034f commit 45f1295

File tree

3 files changed

+9
-2
lines changed

3 files changed

+9
-2
lines changed

visa/HWCaps.inc

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -845,6 +845,13 @@ bool needNopAfterCFInstWA() const {
845845
return false;
846846
}
847847

848+
bool scheduleStoreAway() const {
849+
const TARGET_PLATFORM p = getPlatform();
850+
if (p >= Xe_PVCXT)
851+
return getOption(vISA_schedWithSendSrcReadCycle);
852+
return false;
853+
}
854+
848855
bool hasReadSuppressionOrSharedLocalMemoryWAs() const {
849856
return getPlatform() < Xe2;
850857
}

visa/LocalScheduler/LocalScheduler_G4IR.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2820,7 +2820,7 @@ uint32_t DDD::getEdgeLatency_old(Node *node, DepType depT) const {
28202820

28212821
case WAR_MEMORY:
28222822
case WAW_MEMORY:
2823-
if (kernel->getOption(vISA_schedWithSendSrcReadCycle)) {
2823+
if (kernel->fg.builder->scheduleStoreAway()) {
28242824
latency = LT.getSendSrcReadLatency(inst);
28252825
} else {
28262826
latency = UNCOMPR_LATENCY;

visa/include/VISAOptionsDefs.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -435,7 +435,7 @@ DEF_VISA_OPTION(vISA_ScheduleACCDep, ET_BOOL, "-scheduleACCDep",
435435
"Enable scheduling with accurate ACC dependence, instead of "
436436
"coarse grained dependence",
437437
false)
438-
DEF_VISA_OPTION(vISA_schedWithSendSrcReadCycle, ET_BOOL, "-schedWithSendSrcReadCycle", UNUSED, false)
438+
DEF_VISA_OPTION(vISA_schedWithSendSrcReadCycle, ET_BOOL_TRUE, "-schedWithSendSrcReadCycle", UNUSED, true)
439439

440440
//=== SWSB options ===
441441
DEF_VISA_OPTION(vISA_USEL3HIT, ET_BOOL, "-SBIDL3Hit", UNUSED, false)

0 commit comments

Comments
 (0)