190 lines
		
	
	
		
			7.3 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			190 lines
		
	
	
		
			7.3 KiB
		
	
	
	
		
			LLVM
		
	
	
	
; RUN: llc < %s -mtriple=i386-pc-win32 -mattr=+sse | FileCheck --check-prefix=WIN32 %s
 | 
						|
; RUN: llc < %s -mtriple=x86_64-win32 -mattr=+sse | FileCheck --check-prefix=WIN64 %s
 | 
						|
; RUN: llc < %s -mtriple=x86_64-linux-gnu -mattr=+sse | FileCheck --check-prefix=LINUXOSX %s
 | 
						|
 | 
						|
; WIN32-LABEL:  test_argReti1:
 | 
						|
; WIN32:        incb  %al
 | 
						|
; WIN32:        ret{{.*}}
 | 
						|
 | 
						|
; WIN64-LABEL:  test_argReti1:
 | 
						|
; WIN64:        incb  %al
 | 
						|
; WIN64:        ret{{.*}}
 | 
						|
 | 
						|
; Test regcall when receiving/returning i1
 | 
						|
define x86_regcallcc i1 @test_argReti1(i1 %a)  {
 | 
						|
  %add = add i1 %a, 1
 | 
						|
  ret i1 %add
 | 
						|
}
 | 
						|
 | 
						|
; WIN32-LABEL:  test_CallargReti1:
 | 
						|
; WIN32:        movzbl  %al, %eax
 | 
						|
; WIN32:        call{{.*}}   {{.*}}test_argReti1
 | 
						|
; WIN32:        incb  %al
 | 
						|
; WIN32:        ret{{.*}}
 | 
						|
 | 
						|
; WIN64-LABEL:  test_CallargReti1:
 | 
						|
; WIN64:        movzbl  %al, %eax
 | 
						|
; WIN64:        call{{.*}}   {{.*}}test_argReti1
 | 
						|
; WIN64:        incb  %al
 | 
						|
; WIN64:        ret{{.*}}
 | 
						|
 | 
						|
; Test regcall when passing/retrieving i1
 | 
						|
define x86_regcallcc i1 @test_CallargReti1(i1 %a)  {
 | 
						|
  %b = add i1 %a, 1
 | 
						|
  %c = call x86_regcallcc i1 @test_argReti1(i1 %b)
 | 
						|
  %d = add i1 %c, 1
 | 
						|
  ret i1 %d
 | 
						|
}
 | 
						|
 | 
						|
; WIN64-LABEL: testf32_inp
 | 
						|
; WIN64: movaps {{%xmm(1[2-5])}}, {{.*(%r(b|s)p).*}}  {{#+}} 16-byte Spill
 | 
						|
; WIN64: movaps {{%xmm(1[2-5])}}, {{.*(%r(b|s)p).*}}  {{#+}} 16-byte Spill
 | 
						|
; WIN64: movaps {{%xmm(1[2-5])}}, {{.*(%r(b|s)p).*}}  {{#+}} 16-byte Spill
 | 
						|
; WIN64: movaps {{%xmm(1[2-5])}}, {{.*(%r(b|s)p).*}}  {{#+}} 16-byte Spill
 | 
						|
; WIN64: {{.*}} {{%xmm([0-9]|1[0-1])}}, {{%xmm(1[2-5])}}
 | 
						|
; WIN64: {{.*}} {{%xmm([0-9]|1[0-1])}}, {{%xmm(1[2-5])}}
 | 
						|
; WIN64: {{.*}} {{%xmm([0-9]|1[0-1])}}, {{%xmm(1[2-5])}}
 | 
						|
; WIN64: {{.*}} {{%xmm([0-9]|1[0-1])}}, {{%xmm(1[2-5])}}
 | 
						|
; WIN64: movaps {{.*(%r(b|s)p).*}}, {{%xmm(1[2-5])}}  {{#+}} 16-byte Reload
 | 
						|
; WIN64: movaps {{.*(%r(b|s)p).*}}, {{%xmm(1[2-5])}}  {{#+}} 16-byte Reload
 | 
						|
; WIN64: movaps {{.*(%r(b|s)p).*}}, {{%xmm(1[2-5])}}  {{#+}} 16-byte Reload
 | 
						|
; WIN64: movaps {{.*(%r(b|s)p).*}}, {{%xmm(1[2-5])}}  {{#+}} 16-byte Reload
 | 
						|
; WIN64: retq
 | 
						|
 | 
						|
; WIN32-LABEL: testf32_inp
 | 
						|
; WIN32: movaps {{%xmm([0-7])}}, {{.*(%e(b|s)p).*}}  {{#+}} 16-byte Spill
 | 
						|
; WIN32: {{.*}} {{%xmm[0-7]}}, {{%xmm[4-7]}}
 | 
						|
; WIN32: {{.*}} {{%xmm[0-7]}}, {{%xmm[4-7]}}
 | 
						|
; WIN32: {{.*}} {{%xmm[0-7]}}, {{%xmm[4-7]}}
 | 
						|
; WIN32: {{.*}} {{%xmm[0-7]}}, {{%xmm[4-7]}}
 | 
						|
; WIN32: movaps {{.*(%e(b|s)p).*}}, {{%xmm([0-7])}}  {{#+}} 16-byte Reload
 | 
						|
; WIN32: retl
 | 
						|
 | 
						|
; LINUXOSX-LABEL: testf32_inp
 | 
						|
; LINUXOSX: movaps {{%xmm(1[2-5])}}, {{.*(%r(b|s)p).*}}  {{#+}} 16-byte Spill
 | 
						|
; LINUXOSX: movaps {{%xmm(1[2-5])}}, {{.*(%r(b|s)p).*}}  {{#+}} 16-byte Spill
 | 
						|
; LINUXOSX: movaps {{%xmm(1[2-5])}}, {{.*(%r(b|s)p).*}}  {{#+}} 16-byte Spill
 | 
						|
; LINUXOSX: movaps {{%xmm(1[2-5])}}, {{.*(%r(b|s)p).*}}  {{#+}} 16-byte Spill
 | 
						|
; LINUXOSX: {{.*}} {{%xmm([0-9]|1[0-1])}}, {{%xmm(1[2-5])}}
 | 
						|
; LINUXOSX: {{.*}} {{%xmm([0-9]|1[0-1])}}, {{%xmm(1[2-5])}}
 | 
						|
; LINUXOSX: {{.*}} {{%xmm([0-9]|1[0-1])}}, {{%xmm(1[2-5])}}
 | 
						|
; LINUXOSX: {{.*}} {{%xmm([0-9]|1[0-1])}}, {{%xmm(1[2-5])}}
 | 
						|
; LINUXOSX: movaps {{.*(%r(b|s)p).*}}, {{%xmm(1[2-5])}}  {{#+}} 16-byte Reload
 | 
						|
; LINUXOSX: movaps {{.*(%r(b|s)p).*}}, {{%xmm(1[2-5])}}  {{#+}} 16-byte Reload
 | 
						|
; LINUXOSX: movaps {{.*(%r(b|s)p).*}}, {{%xmm(1[2-5])}}  {{#+}} 16-byte Reload
 | 
						|
; LINUXOSX: movaps {{.*(%r(b|s)p).*}}, {{%xmm(1[2-5])}}  {{#+}} 16-byte Reload
 | 
						|
; LINUXOSX: retq
 | 
						|
 | 
						|
;test calling conventions - input parameters, callee saved xmms
 | 
						|
define x86_regcallcc <16 x float> @testf32_inp(<16 x float> %a, <16 x float> %b, <16 x float> %c) nounwind {
 | 
						|
  %x1 = fadd <16 x float> %a, %b
 | 
						|
  %x2 = fmul <16 x float> %a, %b
 | 
						|
  %x3 = fsub <16 x float> %x1, %x2
 | 
						|
  %x4 = fadd <16 x float> %x3, %c
 | 
						|
  ret <16 x float> %x4
 | 
						|
}
 | 
						|
 | 
						|
; WIN32-LABEL: testi32_inp
 | 
						|
; WIN32: pushl {{%e(si|di|bx|bp)}}
 | 
						|
; WIN32: pushl {{%e(si|di|bx|bp)}}
 | 
						|
; WIN32: popl {{%e(si|di|bx|bp)}}
 | 
						|
; WIN32: popl {{%e(si|di|bx|bp)}}
 | 
						|
; WIN32: retl
 | 
						|
 | 
						|
; WIN64-LABEL: testi32_inp
 | 
						|
; WIN64: pushq	{{%r(bp|bx|1[0-5])}}
 | 
						|
; WIN64: pushq	{{%r(bp|bx|1[0-5])}}
 | 
						|
; WIN64: pushq	{{%r(bp|bx|1[0-5])}}
 | 
						|
; WIN64: popq	{{%r(bp|bx|1[0-5])}}
 | 
						|
; WIN64: popq	{{%r(bp|bx|1[0-5])}}
 | 
						|
; WIN64: popq	{{%r(bp|bx|1[0-5])}}
 | 
						|
; WIN64: retq
 | 
						|
 | 
						|
; LINUXOSX-LABEL: testi32_inp
 | 
						|
; LINUXOSX: pushq	{{%r(bp|bx|1[2-5])}}
 | 
						|
; LINUXOSX: pushq	{{%r(bp|bx|1[2-5])}}
 | 
						|
; LINUXOSX: popq	{{%r(bp|bx|1[2-5])}}
 | 
						|
; LINUXOSX: popq	{{%r(bp|bx|1[2-5])}}
 | 
						|
; LINUXOSX: retq
 | 
						|
 | 
						|
;test calling conventions - input parameters, callee saved GPRs
 | 
						|
define x86_regcallcc i32 @testi32_inp(i32 %a1, i32 %a2, i32 %a3, i32 %a4, i32 %a5, i32 %a6,
 | 
						|
                                      i32 %b1, i32 %b2, i32 %b3, i32 %b4, i32 %b5, i32 %b6) nounwind {
 | 
						|
  %x1 = sub i32 %a1, %a2
 | 
						|
  %x2 = sub i32 %a3, %a4
 | 
						|
  %x3 = sub i32 %a5, %a6
 | 
						|
  %y1 = sub i32 %b1, %b2
 | 
						|
  %y2 = sub i32 %b3, %b4
 | 
						|
  %y3 = sub i32 %b5, %b6
 | 
						|
  %v1 = add i32 %a1, %a2
 | 
						|
  %v2 = add i32 %a3, %a4
 | 
						|
  %v3 = add i32 %a5, %a6
 | 
						|
  %w1 = add i32 %b1, %b2
 | 
						|
  %w2 = add i32 %b3, %b4
 | 
						|
  %w3 = add i32 %b5, %b6
 | 
						|
  %s1 = mul i32 %x1, %y1
 | 
						|
  %s2 = mul i32 %x2, %y2
 | 
						|
  %s3 = mul i32 %x3, %y3
 | 
						|
  %t1 = mul i32 %v1, %w1
 | 
						|
  %t2 = mul i32 %v2, %w2
 | 
						|
  %t3 = mul i32 %v3, %w3
 | 
						|
  %m1 = add i32 %s1, %s2
 | 
						|
  %m2 = add i32 %m1, %s3
 | 
						|
  %n1 = add i32 %t1, %t2
 | 
						|
  %n2 = add i32 %n1, %t3
 | 
						|
  %r1 = add i32 %m2, %n2
 | 
						|
  ret i32 %r1
 | 
						|
}
 | 
						|
 | 
						|
; X32: testf32_stack
 | 
						|
; X32: movaps {{%xmm([0-7])}}, {{(-*[0-9])+}}(%ebp)
 | 
						|
; X32: movaps {{%xmm([0-7])}}, {{(-*[0-9])+}}(%ebp)
 | 
						|
; X32: movaps {{%xmm([0-7])}}, {{(-*[0-9])+}}(%ebp)
 | 
						|
; X32: movaps {{%xmm([0-7])}}, {{(-*[0-9])+}}(%ebp)
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: addps {{([0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: movaps {{(-*[0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: movaps {{(-*[0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: movaps {{(-*[0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
; X32: movaps {{(-*[0-9])+}}(%ebp), {{%xmm([0-7])}}
 | 
						|
 | 
						|
; LINUXOSX: testf32_stack
 | 
						|
; LINUXOSX: addps {{%xmm([0-9]+)}}, {{%xmm([0-9]+)}}
 | 
						|
; LINUXOSX: addps {{%xmm([0-9]+)}}, {{%xmm([0-9]+)}}
 | 
						|
; LINUXOSX: addps {{%xmm([0-9]+)}}, {{%xmm([0-9]+)}}
 | 
						|
; LINUXOSX: addps {{%xmm([0-9]+)}}, {{%xmm([0-9]+)}}
 | 
						|
; LINUXOSX: addps {{%xmm([0-9]+)}}, {{%xmm([0-9]+)}}
 | 
						|
; LINUXOSX: addps {{%xmm([0-9]+)}}, {{%xmm([0-9]+)}}
 | 
						|
; LINUXOSX: addps {{%xmm([0-9]+)}}, {{%xmm([0-9]+)}}
 | 
						|
; LINUXOSX: addps {{%xmm([0-9]+)}}, {{%xmm([0-9]+)}}
 | 
						|
; LINUXOSX: addps {{([0-9])+}}(%rsp), {{%xmm([0-7])}}
 | 
						|
; LINUXOSX: addps {{([0-9])+}}(%rsp), {{%xmm([0-7])}}
 | 
						|
; LINUXOSX: addps {{([0-9])+}}(%rsp), {{%xmm([0-7])}}
 | 
						|
; LINUXOSX: addps {{([0-9])+}}(%rsp), {{%xmm([0-7])}}
 | 
						|
; LINUXOSX: addps {{([0-9])+}}(%rsp), {{%xmm([0-7])}}
 | 
						|
; LINUXOSX: addps {{([0-9])+}}(%rsp), {{%xmm([0-7])}}
 | 
						|
; LINUXOSX: addps {{([0-9])+}}(%rsp), {{%xmm([0-7])}}
 | 
						|
; LINUXOSX: addps {{([0-9])+}}(%rsp), {{%xmm([0-7])}}
 | 
						|
; LINUXOSX: retq
 | 
						|
 | 
						|
; Test that parameters, overflowing register capacity, are passed through the stack
 | 
						|
define x86_regcallcc <32 x float> @testf32_stack(<32 x float> %a, <32 x float> %b, <32 x float> %c) nounwind {
 | 
						|
  %x1 = fadd <32 x float> %a, %b
 | 
						|
  %x2 = fadd <32 x float> %x1, %c
 | 
						|
  ret <32 x float> %x2
 | 
						|
}
 |