46 lines
		
	
	
		
			1.6 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			46 lines
		
	
	
		
			1.6 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; RUN: opt  -mtriple amdgcn-unknown-amdhsa -analyze -divergence -use-gpu-divergence-analysis %s | FileCheck %s
 | |
| 
 | |
| declare i32 @llvm.amdgcn.workitem.id.x() #0
 | |
| declare i32 @llvm.amdgcn.workitem.id.y() #0
 | |
| declare i32 @llvm.amdgcn.workitem.id.z() #0
 | |
| declare i32 @llvm.amdgcn.mbcnt.lo(i32, i32) #0
 | |
| declare i32 @llvm.amdgcn.mbcnt.hi(i32, i32) #0
 | |
| 
 | |
| ; CHECK: DIVERGENT:  %id.x = call i32 @llvm.amdgcn.workitem.id.x()
 | |
| define amdgpu_kernel void @workitem_id_x() #1 {
 | |
|   %id.x = call i32 @llvm.amdgcn.workitem.id.x()
 | |
|   store volatile i32 %id.x, i32 addrspace(1)* undef
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| ; CHECK: DIVERGENT:  %id.y = call i32 @llvm.amdgcn.workitem.id.y()
 | |
| define amdgpu_kernel void @workitem_id_y() #1 {
 | |
|   %id.y = call i32 @llvm.amdgcn.workitem.id.y()
 | |
|   store volatile i32 %id.y, i32 addrspace(1)* undef
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| ; CHECK: DIVERGENT:  %id.z = call i32 @llvm.amdgcn.workitem.id.z()
 | |
| define amdgpu_kernel void @workitem_id_z() #1 {
 | |
|   %id.z = call i32 @llvm.amdgcn.workitem.id.z()
 | |
|   store volatile i32 %id.z, i32 addrspace(1)* undef
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| ; CHECK: DIVERGENT:  %mbcnt.lo = call i32 @llvm.amdgcn.mbcnt.lo(i32 0, i32 0)
 | |
| define amdgpu_kernel void @mbcnt_lo() #1 {
 | |
|   %mbcnt.lo = call i32 @llvm.amdgcn.mbcnt.lo(i32 0, i32 0)
 | |
|   store volatile i32 %mbcnt.lo, i32 addrspace(1)* undef
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| ; CHECK: DIVERGENT:  %mbcnt.hi = call i32 @llvm.amdgcn.mbcnt.hi(i32 0, i32 0)
 | |
| define amdgpu_kernel void @mbcnt_hi() #1 {
 | |
|   %mbcnt.hi = call i32 @llvm.amdgcn.mbcnt.hi(i32 0, i32 0)
 | |
|   store volatile i32 %mbcnt.hi, i32 addrspace(1)* undef
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| attributes #0 = { nounwind readnone }
 | |
| attributes #1 = { nounwind }
 |