@@ -7948,11 +7948,11 @@ bool Optimizer::foldPseudoAndOr(G4_BB* bb, INST_LIST_ITER& ii)
7948
7948
instBuffer.push_back (addInst);
7949
7949
};
7950
7950
7951
- // (W) and (1) r127.2<1>:ud r0.0<0;1,0>:ud 0xFFFFFFE0
7951
+ // (W) and (1) r127.2<1>:ud r0.0<0;1,0>:ud 0xFFFFFFC0
7952
7952
auto getStartAddrInst = [this , &instBuffer, r0, rtail](int subreg)
7953
7953
{
7954
- // (W) and (1) r127.2<1>:ud r0.0<0;1,0>:ud 0xFFFFFFE0
7955
- uint32_t GRFMask = 0x1F ;
7954
+ // (W) and (1) r127.2<1>:ud r0.0<0;1,0>:ud 0xFFFFFFC0
7955
+ uint32_t GRFMask = 0x3F ;
7956
7956
auto src0 = builder.createSrc (r0->getRegVar (), 0 , 0 ,
7957
7957
builder.getRegionScalar (), Type_UD);
7958
7958
auto src1 = builder.createImm (~GRFMask, Type_UD);
@@ -8017,7 +8017,7 @@ bool Optimizer::foldPseudoAndOr(G4_BB* bb, INST_LIST_ITER& ii)
8017
8017
8018
8018
// compute per-thread starting address (r127.2)
8019
8019
// (W) mov (8) r127.0:ud 0x0
8020
- // (W) and (1) r127.2<1>:ud r0.0<0;1,0>:ud 0xFFFFFFE0 // start address
8020
+ // (W) and (1) r127.2<1>:ud r0.0<0;1,0>:ud 0xFFFFFFC0 // start address
8021
8021
// (W) and (1) r127.0:uw r0.4:uw(tid) 0xFF // tid
8022
8022
// (W) add (1) r127.2 r127.2 cross_thread_size
8023
8023
// (W) mad (1) r127.2 r127.2 r127.0 per_thread_size
0 commit comments