[x86] put nops into the WriteNop class and customize for Jaguar

1. Given that we already have a classification bucket with 'nop' in the name, 
   that's where 'nop' belongs. Right now, it's only used for prefix bytes and 'pause'.
2. Set the latency of this class to '1' for Jaguar so that the scheduler (and
   presumably llvm-mca) models the resource requirements better, even though a
   nop has no dependencies.

Differential Revision: https://reviews.llvm.org/D44608

llvm-svn: 327853
This commit is contained in:
Sanjay Patel 2018-03-19 14:26:50 +00:00
parent 749788eab6
commit 05daae75ad
6 changed files with 19 additions and 17 deletions

View File

@ -667,10 +667,10 @@ def FNCLEX : I<0xDB, MRM_E2, (outs), (ins), "fnclex", [], IIC_FNCLEX>;
} // Defs = [FPSW]
} // SchedRW
// Operandless floating-point instructions for the disassembler.
let SchedRW = [WriteMicrocoded] in {
def FNOP : I<0xD9, MRM_D0, (outs), (ins), "fnop", [], IIC_FNOP>;
// Operand-less floating-point instructions for the disassembler.
def FNOP : I<0xD9, MRM_D0, (outs), (ins), "fnop", [], IIC_FNOP>, Sched<[WriteNop]>;
let SchedRW = [WriteMicrocoded] in {
let Defs = [FPSW] in {
def WAIT : I<0x9B, RawFrm, (outs), (ins), "wait", [], IIC_WAIT>;
def FXAM : I<0xD9, MRM_E5, (outs), (ins), "fxam", [], IIC_FXAM>;

View File

@ -1133,7 +1133,7 @@ def trunc_su : PatFrag<(ops node:$src), (trunc node:$src), [{
//
// Nop
let hasSideEffects = 0, SchedRW = [WriteZero] in {
let hasSideEffects = 0, SchedRW = [WriteNop] in {
def NOOP : I<0x90, RawFrm, (outs), (ins), "nop", [], IIC_NOP>;
def NOOPW : I<0x1f, MRMXm, (outs), (ins i16mem:$zero),
"nop{w}\t$zero", [], IIC_NOP>, TB, OpSize16;

View File

@ -286,7 +286,9 @@ defm : JWriteResIntPair<WriteJump, [JALU01], 1>;
def : WriteRes<WriteSystem, [JALU01]> { let Latency = 100; }
def : WriteRes<WriteMicrocoded, [JALU01]> { let Latency = 100; }
def : WriteRes<WriteFence, [JSAGU]>;
def : WriteRes<WriteNop, []>;
// Nops don't have dependencies, so there's no actual latency, but we set this
// to '1' to tell the scheduler that the nop uses an ALU slot for a cycle.
def : WriteRes<WriteNop, [JALU01]> { let Latency = 1; }
////////////////////////////////////////////////////////////////////////////////
// Floating point. This covers both scalar and vector operations.

View File

@ -8389,13 +8389,13 @@ define void @test_nop(i16 %a0, i32 %a1, i64 %a2, i16 *%p0, i32 *%p1, i64 *%p2) o
; BTVER2-LABEL: test_nop:
; BTVER2: # %bb.0:
; BTVER2-NEXT: #APP
; BTVER2-NEXT: nop # sched: [1:?]
; BTVER2-NEXT: nopw %di # sched: [1:?]
; BTVER2-NEXT: nopw (%rcx) # sched: [1:?]
; BTVER2-NEXT: nopl %esi # sched: [1:?]
; BTVER2-NEXT: nopl (%r8) # sched: [1:?]
; BTVER2-NEXT: nopq %rdx # sched: [1:?]
; BTVER2-NEXT: nopq (%r9) # sched: [1:?]
; BTVER2-NEXT: nop # sched: [1:0.50]
; BTVER2-NEXT: nopw %di # sched: [1:0.50]
; BTVER2-NEXT: nopw (%rcx) # sched: [1:0.50]
; BTVER2-NEXT: nopl %esi # sched: [1:0.50]
; BTVER2-NEXT: nopl (%r8) # sched: [1:0.50]
; BTVER2-NEXT: nopq %rdx # sched: [1:0.50]
; BTVER2-NEXT: nopq (%r9) # sched: [1:0.50]
; BTVER2-NEXT: #NO_APP
; BTVER2-NEXT: retq # sched: [4:1.00]
;
@ -9500,7 +9500,7 @@ define void @test_pause() optsize {
; BTVER2-LABEL: test_pause:
; BTVER2: # %bb.0:
; BTVER2-NEXT: #APP
; BTVER2-NEXT: pause # sched: [1:?]
; BTVER2-NEXT: pause # sched: [1:0.50]
; BTVER2-NEXT: #NO_APP
; BTVER2-NEXT: retq # sched: [4:1.00]
;

View File

@ -3763,7 +3763,7 @@ define <4 x float> @test_xorps(<4 x float> %a0, <4 x float> %a1, <4 x float> *%a
ret <4 x float> %7
}
; 'WriteZero' class instructions.
; 'WriteZero' and 'WriteNop' class instructions.
define <4 x float> @test_fnop() nounwind {
; GENERIC-LABEL: test_fnop:
@ -3840,7 +3840,7 @@ define <4 x float> @test_fnop() nounwind {
; BTVER2: # %bb.0:
; BTVER2-NEXT: vxorps %xmm0, %xmm0, %xmm0 # sched: [1:0.50]
; BTVER2-NEXT: #APP
; BTVER2-NEXT: nop # sched: [1:?]
; BTVER2-NEXT: nop # sched: [1:0.50]
; BTVER2-NEXT: #NO_APP
; BTVER2-NEXT: retq # sched: [4:1.00]
;

View File

@ -3209,7 +3209,7 @@ define void @test_fnop() optsize {
; SLM-LABEL: test_fnop:
; SLM: # %bb.0:
; SLM-NEXT: #APP
; SLM-NEXT: fnop # sched: [100:1.00]
; SLM-NEXT: fnop # sched: [1:?]
; SLM-NEXT: #NO_APP
; SLM-NEXT: retl # sched: [4:1.00]
;
@ -3251,7 +3251,7 @@ define void @test_fnop() optsize {
; BTVER2-LABEL: test_fnop:
; BTVER2: # %bb.0:
; BTVER2-NEXT: #APP
; BTVER2-NEXT: fnop # sched: [100:0.50]
; BTVER2-NEXT: fnop # sched: [1:0.50]
; BTVER2-NEXT: #NO_APP
; BTVER2-NEXT: retl # sched: [4:1.00]
;