74 lines
		
	
	
		
			1.8 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			74 lines
		
	
	
		
			1.8 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; Test 32-bit square root.
 | |
| ;
 | |
| ; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s
 | |
| 
 | |
| declare float @llvm.sqrt.f32(float %f)
 | |
| 
 | |
| ; Check register square root.
 | |
| define float @f1(float %val) {
 | |
| ; CHECK: f1:
 | |
| ; CHECK: sqebr %f0, %f0
 | |
| ; CHECK: br %r14
 | |
|   %res = call float @llvm.sqrt.f32(float %val)
 | |
|   ret float %res
 | |
| }
 | |
| 
 | |
| ; Check the low end of the SQEB range.
 | |
| define float @f2(float *%ptr) {
 | |
| ; CHECK: f2:
 | |
| ; CHECK: sqeb %f0, 0(%r2)
 | |
| ; CHECK: br %r14
 | |
|   %val = load float *%ptr
 | |
|   %res = call float @llvm.sqrt.f32(float %val)
 | |
|   ret float %res
 | |
| }
 | |
| 
 | |
| ; Check the high end of the aligned SQEB range.
 | |
| define float @f3(float *%base) {
 | |
| ; CHECK: f3:
 | |
| ; CHECK: sqeb %f0, 4092(%r2)
 | |
| ; CHECK: br %r14
 | |
|   %ptr = getelementptr float *%base, i64 1023
 | |
|   %val = load float *%ptr
 | |
|   %res = call float @llvm.sqrt.f32(float %val)
 | |
|   ret float %res
 | |
| }
 | |
| 
 | |
| ; Check the next word up, which needs separate address logic.
 | |
| ; Other sequences besides this one would be OK.
 | |
| define float @f4(float *%base) {
 | |
| ; CHECK: f4:
 | |
| ; CHECK: aghi %r2, 4096
 | |
| ; CHECK: sqeb %f0, 0(%r2)
 | |
| ; CHECK: br %r14
 | |
|   %ptr = getelementptr float *%base, i64 1024
 | |
|   %val = load float *%ptr
 | |
|   %res = call float @llvm.sqrt.f32(float %val)
 | |
|   ret float %res
 | |
| }
 | |
| 
 | |
| ; Check negative displacements, which also need separate address logic.
 | |
| define float @f5(float *%base) {
 | |
| ; CHECK: f5:
 | |
| ; CHECK: aghi %r2, -4
 | |
| ; CHECK: sqeb %f0, 0(%r2)
 | |
| ; CHECK: br %r14
 | |
|   %ptr = getelementptr float *%base, i64 -1
 | |
|   %val = load float *%ptr
 | |
|   %res = call float @llvm.sqrt.f32(float %val)
 | |
|   ret float %res
 | |
| }
 | |
| 
 | |
| ; Check that SQEB allows indices.
 | |
| define float @f6(float *%base, i64 %index) {
 | |
| ; CHECK: f6:
 | |
| ; CHECK: sllg %r1, %r3, 2
 | |
| ; CHECK: sqeb %f0, 400(%r1,%r2)
 | |
| ; CHECK: br %r14
 | |
|   %ptr1 = getelementptr float *%base, i64 %index
 | |
|   %ptr2 = getelementptr float *%ptr1, i64 100
 | |
|   %val = load float *%ptr2
 | |
|   %res = call float @llvm.sqrt.f32(float %val)
 | |
|   ret float %res
 | |
| }
 |