@@ -5310,18 +5310,18 @@ static MachineBasicBlock *lowerWaveReduce(MachineInstr &MI,
5310
5310
case AMDGPU::S_MAX_U32:
5311
5311
case AMDGPU::S_MAX_I32:
5312
5312
case AMDGPU::S_AND_B32:
5313
- case AMDGPU::S_AND_B64:
5314
- case AMDGPU::S_OR_B32:
5315
- case AMDGPU::S_OR_B64: {
5313
+ case AMDGPU::S_OR_B32: {
5316
5314
// Idempotent operations.
5317
5315
BuildMI(BB, MI, DL, TII->get(AMDGPU::S_MOV_B32), DstReg).addReg(SrcReg);
5318
5316
RetBB = &BB;
5319
5317
break;
5320
5318
}
5321
- case AMDGPU::V_CMP_LT_U64_e64: // umin
5322
- case AMDGPU::V_CMP_LT_I64_e64: // min
5323
- case AMDGPU::V_CMP_GT_U64_e64: // umax
5324
- case AMDGPU::V_CMP_GT_I64_e64: { // max
5319
+ case AMDGPU::V_CMP_LT_U64_e64: // umin
5320
+ case AMDGPU::V_CMP_LT_I64_e64: // min
5321
+ case AMDGPU::V_CMP_GT_U64_e64: // umax
5322
+ case AMDGPU::V_CMP_GT_I64_e64: // max
5323
+ case AMDGPU::S_AND_B64:
5324
+ case AMDGPU::S_OR_B64: {
5325
5325
// Idempotent operations.
5326
5326
BuildMI(BB, MI, DL, TII->get(AMDGPU::S_MOV_B64), DstReg).addReg(SrcReg);
5327
5327
RetBB = &BB;
@@ -5365,7 +5365,7 @@ static MachineBasicBlock *lowerWaveReduce(MachineInstr &MI,
5365
5365
.addReg(NewAccumulator->getOperand(0).getReg())
5366
5366
.addImm(1)
5367
5367
.setOperandDead(3); // Dead scc
5368
- if (is32BitOpc ) {
5368
+ if (Opc == AMDGPU::S_XOR_B32 ) {
5369
5369
BuildMI(BB, MI, DL, TII->get(AMDGPU::S_MUL_I32), DstReg)
5370
5370
.addReg(SrcReg)
5371
5371
.addReg(ParityRegister);
0 commit comments