22 lines
		
	
	
		
			866 B
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			22 lines
		
	
	
		
			866 B
		
	
	
	
		
			LLVM
		
	
	
	
| ; RUN: llc -mtriple=amdgcn--amdhsa -mcpu=fiji -mattr=-flat-for-global -relocation-model=static < %s | FileCheck %s
 | |
| 
 | |
| @lds = external addrspace(3) global [4 x i32]
 | |
| 
 | |
| ; Function Attrs: nounwind
 | |
| 
 | |
| ; Offset folding is an optimization done for global variables with relocations,
 | |
| ; which allows you to store the offset in the r_addend of the relocation entry.
 | |
| ; The offset is applied to the variable's address at link time, which eliminates
 | |
| ; the need to emit shader instructions to do this calculation.
 | |
| ; We don't use relocations for local memory, so we should never fold offsets
 | |
| ; for local memory globals.
 | |
| 
 | |
| ; CHECK-LABEL: lds_no_offset:
 | |
| ; CHECK: ds_write_b32 v{{[0-9]+}}, v{{[0-9]+}} offset:4
 | |
| define amdgpu_kernel void @lds_no_offset() { ; kernel that stores 0 into element 1 of @lds
 | |
| entry:
 | |
|   %ptr = getelementptr [4 x i32], [4 x i32] addrspace(3)* @lds, i32 0, i32 1 ; address of @lds[1], i.e. 4 bytes past the start of @lds
 | |
|   store i32 0, i32 addrspace(3)* %ptr ; the CHECK line for this function expects a ds_write_b32 carrying offset:4
 | |
|   ret void
 | |
| }
 |