246 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			246 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			LLVM
		
	
	
	
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
 | 
						|
; RUN: opt -S -memcpyopt < %s -enable-memcpyopt-memoryssa=0 | FileCheck %s --check-prefixes=CHECK,NO_MSSA
 | 
						|
; RUN: opt -S -memcpyopt < %s -enable-memcpyopt-memoryssa=1 -verify-memoryssa | FileCheck %s --check-prefixes=CHECK,MSSA
 | 
						|
 | 
						|
define i8 @read_dest_between_call_and_memcpy() {
 | 
						|
; CHECK-LABEL: @read_dest_between_call_and_memcpy(
 | 
						|
; CHECK-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[DEST_I8:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; CHECK-NEXT:    [[SRC_I8:%.*]] = bitcast [16 x i8]* [[SRC]] to i8*
 | 
						|
; CHECK-NEXT:    store i8 1, i8* [[DEST_I8]], align 1
 | 
						|
; CHECK-NEXT:    call void @llvm.memset.p0i8.i64(i8* [[SRC_I8]], i8 0, i64 16, i1 false)
 | 
						|
; CHECK-NEXT:    [[X:%.*]] = load i8, i8* [[DEST_I8]], align 1
 | 
						|
; CHECK-NEXT:    call void @llvm.memset.p0i8.i64(i8* [[DEST_I8]], i8 0, i64 16, i1 false)
 | 
						|
; CHECK-NEXT:    ret i8 [[X]]
 | 
						|
;
 | 
						|
  %dest = alloca [16 x i8]
 | 
						|
  %src = alloca [16 x i8]
 | 
						|
  %dest.i8 = bitcast [16 x i8]* %dest to i8*
 | 
						|
  %src.i8 = bitcast [16 x i8]* %src to i8*
 | 
						|
  store i8 1, i8* %dest.i8
 | 
						|
  call void @llvm.memset.p0i8.i64(i8* %src.i8, i8 0, i64 16, i1 false)
 | 
						|
  %x = load i8, i8* %dest.i8
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 16, i1 false)
 | 
						|
  ret i8 %x
 | 
						|
}
 | 
						|
 | 
						|
define i8 @read_src_between_call_and_memcpy() {
 | 
						|
; NO_MSSA-LABEL: @read_src_between_call_and_memcpy(
 | 
						|
; NO_MSSA-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; NO_MSSA-NEXT:    [[SRC:%.*]] = alloca [16 x i8], align 1
 | 
						|
; NO_MSSA-NEXT:    [[DEST_I8:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; NO_MSSA-NEXT:    [[SRC_I8:%.*]] = bitcast [16 x i8]* [[SRC]] to i8*
 | 
						|
; NO_MSSA-NEXT:    call void @llvm.memset.p0i8.i64(i8* [[SRC_I8]], i8 0, i64 16, i1 false)
 | 
						|
; NO_MSSA-NEXT:    [[X:%.*]] = load i8, i8* [[SRC_I8]], align 1
 | 
						|
; NO_MSSA-NEXT:    call void @llvm.memcpy.p0i8.p0i8.i64(i8* [[DEST_I8]], i8* [[SRC_I8]], i64 16, i1 false)
 | 
						|
; NO_MSSA-NEXT:    ret i8 [[X]]
 | 
						|
;
 | 
						|
; MSSA-LABEL: @read_src_between_call_and_memcpy(
 | 
						|
; MSSA-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; MSSA-NEXT:    [[SRC:%.*]] = alloca [16 x i8], align 1
 | 
						|
; MSSA-NEXT:    [[DEST_I8:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; MSSA-NEXT:    [[SRC_I8:%.*]] = bitcast [16 x i8]* [[SRC]] to i8*
 | 
						|
; MSSA-NEXT:    call void @llvm.memset.p0i8.i64(i8* [[SRC_I8]], i8 0, i64 16, i1 false)
 | 
						|
; MSSA-NEXT:    [[X:%.*]] = load i8, i8* [[SRC_I8]], align 1
 | 
						|
; MSSA-NEXT:    call void @llvm.memset.p0i8.i64(i8* [[DEST_I8]], i8 0, i64 16, i1 false)
 | 
						|
; MSSA-NEXT:    ret i8 [[X]]
 | 
						|
;
 | 
						|
  %dest = alloca [16 x i8]
 | 
						|
  %src = alloca [16 x i8]
 | 
						|
  %dest.i8 = bitcast [16 x i8]* %dest to i8*
 | 
						|
  %src.i8 = bitcast [16 x i8]* %src to i8*
 | 
						|
  call void @llvm.memset.p0i8.i64(i8* %src.i8, i8 0, i64 16, i1 false)
 | 
						|
  %x = load i8, i8* %src.i8
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 16, i1 false)
 | 
						|
  ret i8 %x
 | 
						|
}
 | 
						|
 | 
						|
define void @write_dest_between_call_and_memcpy() {
 | 
						|
; CHECK-LABEL: @write_dest_between_call_and_memcpy(
 | 
						|
; CHECK-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[DEST_I8:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; CHECK-NEXT:    [[SRC_I8:%.*]] = bitcast [16 x i8]* [[SRC]] to i8*
 | 
						|
; CHECK-NEXT:    call void @llvm.memset.p0i8.i64(i8* [[SRC_I8]], i8 0, i64 16, i1 false)
 | 
						|
; CHECK-NEXT:    store i8 1, i8* [[DEST_I8]], align 1
 | 
						|
; CHECK-NEXT:    call void @llvm.memset.p0i8.i64(i8* [[DEST_I8]], i8 0, i64 16, i1 false)
 | 
						|
; CHECK-NEXT:    ret void
 | 
						|
;
 | 
						|
  %dest = alloca [16 x i8]
 | 
						|
  %src = alloca [16 x i8]
 | 
						|
  %dest.i8 = bitcast [16 x i8]* %dest to i8*
 | 
						|
  %src.i8 = bitcast [16 x i8]* %src to i8*
 | 
						|
  call void @llvm.memset.p0i8.i64(i8* %src.i8, i8 0, i64 16, i1 false)
 | 
						|
  store i8 1, i8* %dest.i8
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 16, i1 false)
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
define void @write_src_between_call_and_memcpy() {
 | 
						|
; CHECK-LABEL: @write_src_between_call_and_memcpy(
 | 
						|
; CHECK-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[DEST_I8:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; CHECK-NEXT:    [[SRC_I8:%.*]] = bitcast [16 x i8]* [[SRC]] to i8*
 | 
						|
; CHECK-NEXT:    call void @llvm.memset.p0i8.i64(i8* [[SRC_I8]], i8 0, i64 16, i1 false)
 | 
						|
; CHECK-NEXT:    store i8 1, i8* [[SRC_I8]], align 1
 | 
						|
; CHECK-NEXT:    call void @llvm.memcpy.p0i8.p0i8.i64(i8* [[DEST_I8]], i8* [[SRC_I8]], i64 16, i1 false)
 | 
						|
; CHECK-NEXT:    ret void
 | 
						|
;
 | 
						|
  %dest = alloca [16 x i8]
 | 
						|
  %src = alloca [16 x i8]
 | 
						|
  %dest.i8 = bitcast [16 x i8]* %dest to i8*
 | 
						|
  %src.i8 = bitcast [16 x i8]* %src to i8*
 | 
						|
  call void @llvm.memset.p0i8.i64(i8* %src.i8, i8 0, i64 16, i1 false)
 | 
						|
  store i8 1, i8* %src.i8
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 16, i1 false)
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
define void @throw_between_call_and_mempy(i8* dereferenceable(16) %dest.i8) {
 | 
						|
; CHECK-LABEL: @throw_between_call_and_mempy(
 | 
						|
; CHECK-NEXT:    [[SRC:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC_I8:%.*]] = bitcast [16 x i8]* [[SRC]] to i8*
 | 
						|
; CHECK-NEXT:    call void @llvm.memset.p0i8.i64(i8* [[SRC_I8]], i8 0, i64 16, i1 false)
 | 
						|
; CHECK-NEXT:    call void @may_throw() [[ATTR2:#.*]]
 | 
						|
; CHECK-NEXT:    call void @llvm.memset.p0i8.i64(i8* [[DEST_I8:%.*]], i8 0, i64 16, i1 false)
 | 
						|
; CHECK-NEXT:    ret void
 | 
						|
;
 | 
						|
  %src = alloca [16 x i8]
 | 
						|
  %src.i8 = bitcast [16 x i8]* %src to i8*
 | 
						|
  call void @llvm.memset.p0i8.i64(i8* %src.i8, i8 0, i64 16, i1 false)
 | 
						|
  call void @may_throw() readnone
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 16, i1 false)
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
define void @dest_is_gep_nounwind_call() {
 | 
						|
; CHECK-LABEL: @dest_is_gep_nounwind_call(
 | 
						|
; CHECK-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC:%.*]] = alloca [8 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC_I8:%.*]] = bitcast [8 x i8]* [[SRC]] to i8*
 | 
						|
; CHECK-NEXT:    [[DEST_I8:%.*]] = getelementptr [16 x i8], [16 x i8]* [[DEST]], i64 0, i64 8
 | 
						|
; CHECK-NEXT:    [[DEST_I81:%.*]] = bitcast i8* [[DEST_I8]] to [8 x i8]*
 | 
						|
; CHECK-NEXT:    [[DEST_I812:%.*]] = bitcast [8 x i8]* [[DEST_I81]] to i8*
 | 
						|
; CHECK-NEXT:    call void @accept_ptr(i8* [[DEST_I812]]) [[ATTR3:#.*]]
 | 
						|
; CHECK-NEXT:    ret void
 | 
						|
;
 | 
						|
  %dest = alloca [16 x i8]
 | 
						|
  %src = alloca [8 x i8]
 | 
						|
  %src.i8 = bitcast [8 x i8]* %src to i8*
 | 
						|
  %dest.i8 = getelementptr [16 x i8], [16 x i8]* %dest, i64 0, i64 8
 | 
						|
  call void @accept_ptr(i8* %src.i8) nounwind
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 8, i1 false)
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
define void @dest_is_gep_may_throw_call() {
 | 
						|
; CHECK-LABEL: @dest_is_gep_may_throw_call(
 | 
						|
; CHECK-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC:%.*]] = alloca [8 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC_I8:%.*]] = bitcast [8 x i8]* [[SRC]] to i8*
 | 
						|
; CHECK-NEXT:    [[DEST_I8:%.*]] = getelementptr [16 x i8], [16 x i8]* [[DEST]], i64 0, i64 8
 | 
						|
; CHECK-NEXT:    [[DEST_I81:%.*]] = bitcast i8* [[DEST_I8]] to [8 x i8]*
 | 
						|
; CHECK-NEXT:    [[DEST_I812:%.*]] = bitcast [8 x i8]* [[DEST_I81]] to i8*
 | 
						|
; CHECK-NEXT:    call void @accept_ptr(i8* [[DEST_I812]])
 | 
						|
; CHECK-NEXT:    ret void
 | 
						|
;
 | 
						|
  %dest = alloca [16 x i8]
 | 
						|
  %src = alloca [8 x i8]
 | 
						|
  %src.i8 = bitcast [8 x i8]* %src to i8*
 | 
						|
  %dest.i8 = getelementptr [16 x i8], [16 x i8]* %dest, i64 0, i64 8
 | 
						|
  call void @accept_ptr(i8* %src.i8)
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 8, i1 false)
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
define void @dest_is_gep_requires_movement() {
 | 
						|
; CHECK-LABEL: @dest_is_gep_requires_movement(
 | 
						|
; CHECK-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC:%.*]] = alloca [8 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC_I8:%.*]] = bitcast [8 x i8]* [[SRC]] to i8*
 | 
						|
; CHECK-NEXT:    [[DEST_I8:%.*]] = getelementptr [16 x i8], [16 x i8]* [[DEST]], i64 0, i64 8
 | 
						|
; CHECK-NEXT:    [[DEST_I81:%.*]] = bitcast i8* [[DEST_I8]] to [8 x i8]*
 | 
						|
; CHECK-NEXT:    [[DEST_I812:%.*]] = bitcast [8 x i8]* [[DEST_I81]] to i8*
 | 
						|
; CHECK-NEXT:    call void @accept_ptr(i8* [[DEST_I812]]) [[ATTR3]]
 | 
						|
; CHECK-NEXT:    ret void
 | 
						|
;
 | 
						|
  %dest = alloca [16 x i8]
 | 
						|
  %src = alloca [8 x i8]
 | 
						|
  %src.i8 = bitcast [8 x i8]* %src to i8*
 | 
						|
  call void @accept_ptr(i8* %src.i8) nounwind
 | 
						|
  %dest.i8 = getelementptr [16 x i8], [16 x i8]* %dest, i64 0, i64 8
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 8, i1 false)
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
define void @capture_before_call_argmemonly() {
 | 
						|
; CHECK-LABEL: @capture_before_call_argmemonly(
 | 
						|
; CHECK-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[DEST_I8:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; CHECK-NEXT:    [[SRC_I8:%.*]] = bitcast [16 x i8]* [[SRC]] to i8*
 | 
						|
; CHECK-NEXT:    call void @accept_ptr(i8* [[DEST_I8]])
 | 
						|
; CHECK-NEXT:    [[DEST1:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; CHECK-NEXT:    call void @accept_ptr(i8* [[DEST1]]) [[ATTR4:#.*]]
 | 
						|
; CHECK-NEXT:    ret void
 | 
						|
;
 | 
						|
  %dest = alloca [16 x i8]
 | 
						|
  %src = alloca [16 x i8]
 | 
						|
  %dest.i8 = bitcast [16 x i8]* %dest to i8*
 | 
						|
  %src.i8 = bitcast [16 x i8]* %src to i8*
 | 
						|
  call void @accept_ptr(i8* %dest.i8) ; capture
 | 
						|
  call void @accept_ptr(i8* %src.i8) argmemonly
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 16, i1 false)
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
define void @capture_before_call_argmemonly_nounwind() {
 | 
						|
; CHECK-LABEL: @capture_before_call_argmemonly_nounwind(
 | 
						|
; CHECK-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[DEST_I8:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; CHECK-NEXT:    [[SRC_I8:%.*]] = bitcast [16 x i8]* [[SRC]] to i8*
 | 
						|
; CHECK-NEXT:    call void @accept_ptr(i8* [[DEST_I8]])
 | 
						|
; CHECK-NEXT:    [[DEST1:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; CHECK-NEXT:    call void @accept_ptr(i8* [[DEST1]]) [[ATTR5:#.*]]
 | 
						|
; CHECK-NEXT:    ret void
 | 
						|
;
 | 
						|
  %dest = alloca [16 x i8]
 | 
						|
  %src = alloca [16 x i8]
 | 
						|
  %dest.i8 = bitcast [16 x i8]* %dest to i8*
 | 
						|
  %src.i8 = bitcast [16 x i8]* %src to i8*
 | 
						|
  call void @accept_ptr(i8* %dest.i8) ; capture
 | 
						|
  ; NB: argmemonly currently implies willreturn.
 | 
						|
  call void @accept_ptr(i8* %src.i8) argmemonly nounwind
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 16, i1 false)
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
define void @capture_before_call_argmemonly_nounwind_willreturn() {
 | 
						|
; CHECK-LABEL: @capture_before_call_argmemonly_nounwind_willreturn(
 | 
						|
; CHECK-NEXT:    [[DEST:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[SRC:%.*]] = alloca [16 x i8], align 1
 | 
						|
; CHECK-NEXT:    [[DEST_I8:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; CHECK-NEXT:    [[SRC_I8:%.*]] = bitcast [16 x i8]* [[SRC]] to i8*
 | 
						|
; CHECK-NEXT:    call void @accept_ptr(i8* [[DEST_I8]])
 | 
						|
; CHECK-NEXT:    [[DEST1:%.*]] = bitcast [16 x i8]* [[DEST]] to i8*
 | 
						|
; CHECK-NEXT:    call void @accept_ptr(i8* [[DEST1]]) [[ATTR0:#.*]]
 | 
						|
; CHECK-NEXT:    ret void
 | 
						|
;
 | 
						|
  %dest = alloca [16 x i8]
 | 
						|
  %src = alloca [16 x i8]
 | 
						|
  %dest.i8 = bitcast [16 x i8]* %dest to i8*
 | 
						|
  %src.i8 = bitcast [16 x i8]* %src to i8*
 | 
						|
  call void @accept_ptr(i8* %dest.i8) ; capture
 | 
						|
  call void @accept_ptr(i8* %src.i8) argmemonly nounwind willreturn
 | 
						|
  call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dest.i8, i8* %src.i8, i64 16, i1 false)
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
declare void @may_throw()
 | 
						|
declare void @accept_ptr(i8*)
 | 
						|
declare void @llvm.memcpy.p0i8.p0i8.i64(i8*, i8*, i64, i1)
 | 
						|
declare void @llvm.memset.p0i8.i64(i8*, i8, i64, i1)
 |