; Checks how llc materializes small integer constants (1, -1, 5, -5) on x86,
; with and without the optsize/minsize function attributes.

; Compile this file once per target; each output is verified against its own
; FileCheck prefix (32-bit Linux, 64-bit Linux, 64-bit Windows).
; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=+cmov %s -o - \
; RUN:   | FileCheck %s --check-prefix=CHECK32
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+cmov %s -o - \
; RUN:   | FileCheck %s --check-prefix=CHECK64
; RUN: llc -mtriple=x86_64-pc-win32 -mattr=+cmov %s -o - \
; RUN:   | FileCheck %s --check-prefix=CHECKWIN64
 | |
| 
 | |
; Baseline: with no size attribute on the function, the constant 1 is expected
; to be loaded with a plain mov on both Linux targets.
;
; CHECK32-LABEL: one32_nooptsize:
; CHECK32: movl $1, %eax
; CHECK32-NEXT: retl
;
; CHECK64-LABEL: one32_nooptsize:
; CHECK64: movl $1, %eax
; CHECK64-NEXT: retq
define i32 @one32_nooptsize() {
entry:
  ret i32 1
}
 | |
| 
 | |
; Under optsize the 32-bit target is expected to build 1 as xor followed by inc.
;
; CHECK32-LABEL: one32:
; CHECK32: xorl %eax, %eax
; CHECK32-NEXT: incl %eax
; CHECK32-NEXT: retl
;
; FIXME: Figure out the best approach in 64-bit mode.
; For now the 64-bit target is expected to keep the plain mov.
;
; CHECK64-LABEL: one32:
; CHECK64: movl $1, %eax
; CHECK64-NEXT: retq
define i32 @one32() optsize {
entry:
  ret i32 1
}
 | |
| 
 | |
; 32-bit: even under minsize, xor + inc is chosen in preference to push + pop.
;
; CHECK32-LABEL: one32_minsize:
; CHECK32: xorl %eax, %eax
; CHECK32-NEXT: incl %eax
; CHECK32-NEXT: retl
;
; 64-bit: xor + inc is not implemented yet, so push + pop is expected. The pop
; has to target the full 64-bit register although only 32 bits are needed.
;
; CHECK64-LABEL: one32_minsize:
; CHECK64: pushq $1
; CHECK64: .cfi_adjust_cfa_offset 8
; CHECK64: popq %rax
; CHECK64: .cfi_adjust_cfa_offset -8
; CHECK64-NEXT: retq
;
; Win64: the stack may not be adjusted without a frame pointer, so a plain mov
; is expected instead.
;
; CHECKWIN64-LABEL: one32_minsize:
; CHECKWIN64: movl $1, %eax
; CHECKWIN64-NEXT: retq
define i32 @one32_minsize() minsize {
entry:
  ret i32 1
}
 | |
| 
 | |
; Regression test for PR26023: a minsize function with a 120-byte local buffer
; that materializes the constant 5 for an inline-asm register operand.
;
; 64-bit: the function writes to the redzone, so push + pop must not be used
; and a mov of the immediate is expected.
;
; CHECK64-LABEL: pr26023:
; CHECK64: movl $5, %ecx
; CHECK64: retq
;
; 32-bit x86 has no redzone, so push + pop is expected there.
;
; CHECK32-LABEL: pr26023:
; CHECK32: pushl $5
; CHECK32: popl %ecx
; CHECK32: retl
define i32 @pr26023() minsize {
entry:
  %buf = alloca [120 x i8]
  %first = getelementptr inbounds [120 x i8], [120 x i8]* %buf, i64 0, i64 0
  ; Hand the buffer address to an empty asm that also clobbers memory.
  call void asm sideeffect "", "imr,~{memory},~{dirflag},~{fpsr},~{flags}"(i8* %first)
  %last = getelementptr inbounds [120 x i8], [120 x i8]* %buf, i64 0, i64 119
  store volatile i8 -2, i8* %last
  ; The constant 5 must be placed in a register between the store and the load.
  call void asm sideeffect "", "r,~{dirflag},~{fpsr},~{flags}"(i32 5)
  %byte = load volatile i8, i8* %last
  %widened = sext i8 %byte to i32
  ret i32 %widened
}
 | |
| 
 | |
| 
 | |
; 64-bit: xor + inc is not implemented yet, so a 64-bit 1 is expected to be
; produced with push + pop under minsize.
;
; CHECK64-LABEL: one64_minsize:
; CHECK64: pushq $1
; CHECK64: .cfi_adjust_cfa_offset 8
; CHECK64: popq %rax
; CHECK64: .cfi_adjust_cfa_offset -8
; CHECK64-NEXT: retq
;
; Win64: the stack may not be adjusted without a frame pointer, so a plain mov
; is expected instead.
;
; CHECKWIN64-LABEL: one64_minsize:
; CHECKWIN64: movl $1, %eax
; CHECKWIN64-NEXT: retq
define i64 @one64_minsize() minsize {
entry:
  ret i64 1
}
 | |
| 
 | |
; Under optsize the 32-bit target is expected to build -1 as xor followed by dec.
;
; CHECK32-LABEL: minus_one32:
; CHECK32: xorl %eax, %eax
; CHECK32-NEXT: decl %eax
; CHECK32-NEXT: retl
define i32 @minus_one32() optsize {
entry:
  ret i32 -1
}
 | |
| 
 | |
; Under minsize, xor + dec is still chosen in preference to push + pop for -1.
;
; CHECK32-LABEL: minus_one32_minsize:
; CHECK32: xorl %eax, %eax
; CHECK32-NEXT: decl %eax
; CHECK32-NEXT: retl
define i32 @minus_one32_minsize() minsize {
entry:
  ret i32 -1
}
 | |
| 
 | |
; A 16-bit 1 under optsize is expected to be built in the full 32-bit register
; with xor + inc; a kill annotation is expected right before the return.
;
; CHECK32-LABEL: one16:
; CHECK32: xorl %eax, %eax
; CHECK32-NEXT: incl %eax
; CHECK32-NEXT: # kill
; CHECK32-NEXT: retl
define i16 @one16() optsize {
entry:
  ret i16 1
}
 | |
| 
 | |
; A 16-bit -1 under optsize is expected to be built in the full 32-bit register
; with xor + dec; a kill annotation is expected right before the return.
;
; CHECK32-LABEL: minus_one16:
; CHECK32: xorl %eax, %eax
; CHECK32-NEXT: decl %eax
; CHECK32-NEXT: # kill
; CHECK32-NEXT: retl
define i16 @minus_one16() optsize {
entry:
  ret i16 -1
}
 | |
| 
 | |
; Under minsize the 32-bit target is expected to produce -5 with push + pop.
;
; CHECK32-LABEL: minus_five32:
; CHECK32:       pushl $-5
; CHECK32:       popl %eax
; CHECK32:       retl
define i32 @minus_five32() minsize {
entry:
  ret i32 -5
}
 | |
| 
 | |
; Under minsize the 64-bit Linux target is expected to produce -5 with
; push + pop, with a CFA adjustment recorded after each stack change.
;
; CHECK64-LABEL: minus_five64:
; CHECK64:       pushq $-5
; CHECK64:       .cfi_adjust_cfa_offset 8
; CHECK64:       popq %rax
; CHECK64:       .cfi_adjust_cfa_offset -8
; CHECK64:       retq
define i64 @minus_five64() minsize {
entry:
  ret i64 -5
}
 | |
| 
 | |
; Verifies that -1 is rematerialized with xor + dec after every usable register
; has been clobbered, rather than being spilled to the stack and reloaded.
define i32 @rematerialize_minus_one() optsize {
entry:
  ; Materialize -1 (thiscall forces it into %ecx).
  tail call x86_thiscallcc void @f(i32 -1)

  ; Clobber all registers except %esp, leaving nowhere to store the -1 besides
  ; spilling it to the stack.
  tail call void asm sideeffect "", "~{eax},~{ebx},~{ecx},~{edx},~{edi},~{esi},~{ebp},~{dirflag},~{fpsr},~{flags}"()

  ; -1 should be re-materialized here instead of getting spilled above.
  ret i32 -1

; The label carries a trailing colon so that it anchors on the function's own
; label line; the bare name is also a prefix of the next function's name.
; CHECK32-LABEL: rematerialize_minus_one:
; CHECK32:       xorl %ecx, %ecx
; CHECK32-NEXT:  decl %ecx
; CHECK32:       calll
; CHECK32:       xorl %eax, %eax
; CHECK32-NEXT:  decl %eax
; CHECK32-NOT:   %eax
; CHECK32:       retl
}
 | |
| 
 | |
; Verifies that when -1 has to be rematerialized while eflags is live (between
; the compare and the cmov), the flag-clobbering xor + dec sequence is avoided
; and a plain mov of the immediate is used instead.
define i32 @rematerialize_minus_one_eflags(i32 %x) optsize {
entry:
  ; Materialize -1 (thiscall forces it into %ecx).
  tail call x86_thiscallcc void @f(i32 -1)

  ; Clobber all registers except %esp, leaving nowhere to store the -1 besides
  ; spilling it to the stack.
  tail call void asm sideeffect "", "~{eax},~{ebx},~{ecx},~{edx},~{edi},~{esi},~{ebp},~{dirflag},~{fpsr},~{flags}"()

  ; Define eflags.
  %a = icmp ne i32 %x, 123
  %b = zext i1 %a to i32
  ; Cause -1 to be rematerialized right in front of the cmov, which needs eflags.
  ; It must therefore not use the xor-dec lowering.
  %c = select i1 %a, i32 %b, i32 -1
  ret i32 %c

; The label carries a trailing colon, like the other labels in this file, so
; that it anchors on the function's own label line.
; CHECK32-LABEL: rematerialize_minus_one_eflags:
; CHECK32:       xorl %ecx, %ecx
; CHECK32-NEXT:  decl %ecx
; CHECK32:       calll
; CHECK32:       cmpl
; CHECK32:       setne
; CHECK32-NOT:   xorl
; CHECK32:       movl $-1
; CHECK32:       cmov
; CHECK32:       retl
}
 | |
| 
 | |
; External callee used by the rematerialization tests; it is called with the
; thiscall convention so that its i32 argument is passed in %ecx.
declare x86_thiscallcc void @f(i32)
 |