[X86] Relax restrictions on what setcc condition codes can be folded with a sext when AVX512 is enabled.
We now allow all signed comparisons and not equal. The complement that needs to be added for this is no worse than the extend. And the vector output forms of pcmpeq/pcmpgt have better latency than the k-register version on SKX. llvm-svn: 324294
This commit is contained in:
parent
d9a97a20c0
commit
9c6c7c5e9b
|
|
@ -36118,8 +36118,7 @@ static SDValue combineExtSetcc(SDNode *N, SelectionDAG &DAG,
|
|||
// Don't fold if the condition code can't be handled by PCMPEQ/PCMPGT since
|
||||
// that's the only integer compares with we have.
|
||||
ISD::CondCode CC = cast<CondCodeSDNode>(N0->getOperand(2))->get();
|
||||
if (ISD::isUnsignedIntSetCC(CC) || CC == ISD::SETLE || CC == ISD::SETGE ||
|
||||
CC == ISD::SETNE)
|
||||
if (ISD::isUnsignedIntSetCC(CC))
|
||||
return SDValue();
|
||||
|
||||
// Only do this combine if the extension will be fully consumed by the setcc.
|
||||
|
|
|
|||
|
|
@ -1415,8 +1415,8 @@ define <8 x i32> @sext_8i1_8i32(<8 x i32> %a1, <8 x i32> %a2) nounwind {
|
|||
;
|
||||
; SKX-LABEL: sext_8i1_8i32:
|
||||
; SKX: # %bb.0:
|
||||
; SKX-NEXT: vpcmpled %ymm0, %ymm1, %k0
|
||||
; SKX-NEXT: vpmovm2d %k0, %ymm0
|
||||
; SKX-NEXT: vpcmpgtd %ymm0, %ymm1, %ymm0
|
||||
; SKX-NEXT: vpternlogq $15, %ymm0, %ymm0, %ymm0
|
||||
; SKX-NEXT: retq
|
||||
%x = icmp slt <8 x i32> %a1, %a2
|
||||
%x1 = xor <8 x i1>%x, <i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true>
|
||||
|
|
|
|||
|
|
@ -4365,14 +4365,14 @@ define i8 @trunc_8i16_to_8i1(<8 x i16> %a) {
|
|||
define <8 x i32> @sext_8i1_8i32(<8 x i32> %a1, <8 x i32> %a2) nounwind {
|
||||
; GENERIC-LABEL: sext_8i1_8i32:
|
||||
; GENERIC: # %bb.0:
|
||||
; GENERIC-NEXT: vpcmpled %ymm0, %ymm1, %k0 # sched: [3:1.00]
|
||||
; GENERIC-NEXT: vpmovm2d %k0, %ymm0 # sched: [1:0.33]
|
||||
; GENERIC-NEXT: vpcmpgtd %ymm0, %ymm1, %ymm0 # sched: [3:1.00]
|
||||
; GENERIC-NEXT: vpternlogq $15, %ymm0, %ymm0, %ymm0 # sched: [3:1.00]
|
||||
; GENERIC-NEXT: retq # sched: [1:1.00]
|
||||
;
|
||||
; SKX-LABEL: sext_8i1_8i32:
|
||||
; SKX: # %bb.0:
|
||||
; SKX-NEXT: vpcmpled %ymm0, %ymm1, %k0 # sched: [3:1.00]
|
||||
; SKX-NEXT: vpmovm2d %k0, %ymm0 # sched: [1:0.25]
|
||||
; SKX-NEXT: vpcmpgtd %ymm0, %ymm1, %ymm0 # sched: [1:0.50]
|
||||
; SKX-NEXT: vpternlogq $15, %ymm0, %ymm0, %ymm0 # sched: [1:0.33]
|
||||
; SKX-NEXT: retq # sched: [7:1.00]
|
||||
%x = icmp slt <8 x i32> %a1, %a2
|
||||
%x1 = xor <8 x i1>%x, <i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true, i1 true>
|
||||
|
|
|
|||
Loading…
Reference in New Issue