32 lines
		
	
	
		
			1.3 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			32 lines
		
	
	
		
			1.3 KiB
		
	
	
	
		
			LLVM
		
	
	
	
; RUN: opt < %s -instcombine -S | grep "align 32" | count 2
 | 
						|
 | 
						|
; It's tempting to have an instcombine in which the src pointer of a
; memcpy is aligned up to the alignment of the destination, however
; there are pitfalls. If the src is an alloca, aligning it beyond what
; the target's stack pointer is aligned at will require dynamic
; stack realignment, which can require functions that don't otherwise
; need a frame pointer to need one.
;
; Abstaining from this transform is not the only way to approach this
; issue. Some late phase could be smart enough to reduce alloca
; alignments when they are greater than they need to be. Or, codegen
; could do dynamic alignment for just the one alloca, and leave the
; main stack pointer at its standard alignment.
;
 | 
						|
 | 
						|
 | 
						|
; Zero-initialized 1024-byte global declared with 32-byte alignment; it is the
; destination operand of the memcpy in @foo.
@dst = global [1024 x i8] zeroinitializer, align 32
 | 
						|
 | 
						|
; Copies a 1024-byte stack buffer into @dst and then hands the buffer to @frob.
; The RUN line counts the output lines that mention the 32-byte alignment; the
; two it expects appear to be the @dst definition and the memcpy call, so the
; alloca below is presumably expected to keep its original 1-byte alignment.
define void @foo() nounwind {
entry:
  ; Stack buffer that is deliberately declared with only 1-byte alignment.
  %src = alloca [1024 x i8], align 1
  ; i8* to the first element of the stack buffer.
  %src1 = getelementptr [1024 x i8], [1024 x i8]* %src, i32 0, i32 0
  ; Copy all 1024 bytes from the stack buffer to the start of @dst.
  call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 32 getelementptr inbounds ([1024 x i8], [1024 x i8]* @dst, i32 0, i32 0), i8* align 32 %src1, i32 1024, i1 false)
  ; Pass the buffer to an external function that is only declared in this file.
  call void @frob(i8* %src1) nounwind
  ret void
}
 | 
						|
 | 
						|
; External function taking an i8*; only declared here. @foo passes it the
; pointer to its stack buffer.
declare void @frob(i8*)
 | 
						|
 | 
						|
; Declaration of the memcpy intrinsic used by @foo. Operands, per the LLVM
; Language Reference: destination pointer, source pointer, i32 byte count,
; and an i1 volatile flag.
declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture, i32, i1) nounwind
 |