Skip to content

Commit 359fde6

Browse files
committed
Formatting and tidying up, responding to reviewer comments
1 parent 8bdc32c commit 359fde6

File tree

5 files changed

+117
-3935
lines changed

5 files changed

+117
-3935
lines changed

llvm/lib/Target/AMDGPU/AMDGPUISelLowering.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5077,7 +5077,7 @@ SDValue AMDGPUTargetLowering::performFNegCombine(SDNode *N,
50775077
EVT LHVT = LHS.getValueType();
50785078
EVT RHVT = RHS.getValueType();
50795079
// The regression was limited to i32 v2/i32.
5080-
if(RHVT != MVT::i32 && LHVT != MVT::i32)
5080+
if (RHVT != MVT::i32 && LHVT != MVT::i32)
50815081
return SDValue();
50825082

50835083
SDValue LFNeg = DAG.getNode(ISD::FNEG, SL, LHVT, LHS);

llvm/lib/Target/AMDGPU/SIISelLowering.cpp

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -13014,12 +13014,8 @@ SDValue SITargetLowering::performXorCombine(SDNode *N,
1301413014
return DAG.getNode(ISD::BITCAST, DL, VT, NewSelect);
1301513015
}
1301613016
}
13017-
// Possibly split vector here if one side does have a constant RHS.
1301813017
}
1301913018

13020-
// Add test for when only one of the RHS vector elements is a const. Might be
13021-
// possible to optimise this case.
13022-
1302313019
const ConstantSDNode *CRHS = dyn_cast<ConstantSDNode>(RHS);
1302413020

1302513021
if (CRHS && VT == MVT::i64) {

llvm/lib/Target/AMDGPU/SIInstructions.td

Lines changed: 18 additions & 26 deletions
Original file line numberDiff line numberDiff line change
@@ -1793,7 +1793,6 @@ def : GCNPat <
17931793
>;
17941794
}
17951795

1796-
17971796
/********** ================================ **********/
17981797
/********** Floating point absolute/negative **********/
17991798
/********** ================================ **********/
@@ -2389,31 +2388,25 @@ def : GCNPat<(i32 (trunc (srl i64:$src0, (i32 ShiftAmt32Imm:$src1)))),
23892388
} // end True16Predicate = NotHasTrue16BitInsts
23902389

23912390
let True16Predicate = UseRealTrue16Insts in {
2391+
def : GCNPat<(rotr i32:$src0, i32:$src1),
2392+
(V_ALIGNBIT_B32_t16_e64 /* src0_modifiers */ 0, $src0,
2393+
/* src1_modifiers */ 0, $src0,
2394+
/* src2_modifiers */ 0, (EXTRACT_SUBREG $src1, lo16),
2395+
/* clamp */ 0, /* op_sel */ 0)>;
23922396

2393-
def : GCNPat <
2394-
(rotr i32:$src0, i32:$src1),
2395-
(V_ALIGNBIT_B32_t16_e64 /* src0_modifiers */ 0, $src0,
2396-
/* src1_modifiers */ 0, $src0,
2397-
/* src2_modifiers */ 0,
2398-
(EXTRACT_SUBREG $src1, lo16),
2399-
/* clamp */ 0, /* op_sel */ 0)
2400-
>;
2401-
2402-
def : GCNPat<(i32 (trunc (srl i64:$src0, (i32 ShiftAmt32Imm:$src1)))),
2403-
(V_ALIGNBIT_B32_t16_e64 0, /* src0_modifiers */
2404-
(i32 (EXTRACT_SUBREG (i64 $src0), sub1)),
2405-
0, /* src1_modifiers */
2406-
(i32 (EXTRACT_SUBREG (i64 $src0), sub0)),
2407-
0, /* src2_modifiers */
2408-
(i16 (EXTRACT_SUBREG VGPR_32:$src1, lo16)),
2409-
/* clamp */ 0, /* op_sel */ 0)>;
2410-
2411-
def : GCNPat<(fshr i32:$src0, i32:$src1, i32:$src2),
2412-
(V_ALIGNBIT_B32_t16_e64 /* src0_modifiers */ 0, $src0,
2413-
/* src1_modifiers */ 0, $src1,
2414-
/* src2_modifiers */ 0,
2415-
(EXTRACT_SUBREG VGPR_32:$src2, lo16),
2416-
/* clamp */ 0, /* op_sel */ 0)>;
2397+
def : GCNPat<
2398+
(i32(trunc(srl i64:$src0, (i32 ShiftAmt32Imm:$src1)))),
2399+
(V_ALIGNBIT_B32_t16_e64 0, /* src0_modifiers */
2400+
(i32(EXTRACT_SUBREG(i64 $src0), sub1)), 0, /* src1_modifiers */
2401+
(i32(EXTRACT_SUBREG(i64 $src0), sub0)), 0, /* src2_modifiers */
2402+
(i16(EXTRACT_SUBREG VGPR_32:$src1, lo16)),
2403+
/* clamp */ 0, /* op_sel */ 0)>;
2404+
2405+
def : GCNPat<(fshr i32:$src0, i32:$src1, i32:$src2),
2406+
(V_ALIGNBIT_B32_t16_e64 /* src0_modifiers */ 0, $src0,
2407+
/* src1_modifiers */ 0, $src1,
2408+
/* src2_modifiers */ 0, (EXTRACT_SUBREG VGPR_32:$src2, lo16),
2409+
/* clamp */ 0, /* op_sel */ 0)>;
24172410
} // end True16Predicate = UseRealTrue16Insts
24182411

24192412
let True16Predicate = UseFakeTrue16Insts in {
@@ -2451,7 +2444,6 @@ def : GCNPat<(fshr i32:$src0, i32:$src1, i32:$src2),
24512444
>;
24522445
} // end True16Predicate = UseFakeTrue16Insts
24532446

2454-
24552447
/********** ====================== **********/
24562448
/********** Indirect addressing **********/
24572449
/********** ====================== **********/

0 commit comments

Comments
 (0)