158 lines
		
	
	
		
			7.3 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			158 lines
		
	
	
		
			7.3 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
 | |
| ; RUN: opt -instcombine %s -S | FileCheck %s
 | |
| 
 | |
| @block = global [64 x [8192 x i8]] zeroinitializer, align 1
 | |
| 
 | |
| define <2 x i8*> @vectorindex1() {
 | |
| ; CHECK-LABEL: @vectorindex1(
 | |
| ; CHECK-NEXT:    ret <2 x i8*> getelementptr inbounds ([64 x [8192 x i8]], [64 x [8192 x i8]]* @block, <2 x i64> zeroinitializer, <2 x i64> <i64 1, i64 2>, <2 x i64> zeroinitializer)
 | |
| ;
 | |
|   %1 = getelementptr inbounds [64 x [8192 x i8]], [64 x [8192 x i8]]* @block, i64 0, <2 x i64> <i64 0, i64 1>, i64 8192
 | |
|   ret <2 x i8*> %1
 | |
| }
 | |
| 
 | |
| define <2 x i8*> @vectorindex2() {
 | |
| ; CHECK-LABEL: @vectorindex2(
 | |
| ; CHECK-NEXT:    ret <2 x i8*> getelementptr inbounds ([64 x [8192 x i8]], [64 x [8192 x i8]]* @block, <2 x i64> zeroinitializer, <2 x i64> <i64 1, i64 2>, <2 x i64> <i64 8191, i64 1>)
 | |
| ;
 | |
|   %1 = getelementptr inbounds [64 x [8192 x i8]], [64 x [8192 x i8]]* @block, i64 0, i64 1, <2 x i64> <i64 8191, i64 8193>
 | |
|   ret <2 x i8*> %1
 | |
| }
 | |
| 
 | |
| define <2 x i8*> @vectorindex3() {
 | |
| ; CHECK-LABEL: @vectorindex3(
 | |
| ; CHECK-NEXT:    ret <2 x i8*> getelementptr inbounds ([64 x [8192 x i8]], [64 x [8192 x i8]]* @block, <2 x i64> zeroinitializer, <2 x i64> <i64 0, i64 2>, <2 x i64> <i64 8191, i64 1>)
 | |
| ;
 | |
|   %1 = getelementptr inbounds [64 x [8192 x i8]], [64 x [8192 x i8]]* @block, i64 0, <2 x i64> <i64 0, i64 1>, <2 x i64> <i64 8191, i64 8193>
 | |
|   ret <2 x i8*> %1
 | |
| }
 | |
| 
 | |
| ; Negative test - datalayout's alloc size for the 2 types must match.
 | |
| 
 | |
| define i32* @bitcast_vec_to_array_gep(<7 x i32>* %x, i64 %y, i64 %z) {
 | |
| ; CHECK-LABEL: @bitcast_vec_to_array_gep(
 | |
| ; CHECK-NEXT:    [[ARR_PTR:%.*]] = bitcast <7 x i32>* [[X:%.*]] to [7 x i32]*
 | |
| ; CHECK-NEXT:    [[GEP:%.*]] = getelementptr [7 x i32], [7 x i32]* [[ARR_PTR]], i64 [[Y:%.*]], i64 [[Z:%.*]]
 | |
| ; CHECK-NEXT:    ret i32* [[GEP]]
 | |
| ;
 | |
|   %arr_ptr = bitcast <7 x i32>* %x to [7 x i32]*
 | |
|   %gep = getelementptr [7 x i32], [7 x i32]* %arr_ptr, i64 %y, i64 %z
 | |
|   ret i32* %gep
 | |
| }
 | |
| 
 | |
| ; Negative test - datalayout's alloc size for the 2 types must match.
 | |
| 
 | |
| define i32* @bitcast_array_to_vec_gep([3 x i32]* %x, i64 %y, i64 %z) {
 | |
| ; CHECK-LABEL: @bitcast_array_to_vec_gep(
 | |
| ; CHECK-NEXT:    [[VEC_PTR:%.*]] = bitcast [3 x i32]* [[X:%.*]] to <3 x i32>*
 | |
| ; CHECK-NEXT:    [[GEP:%.*]] = getelementptr inbounds <3 x i32>, <3 x i32>* [[VEC_PTR]], i64 [[Y:%.*]], i64 [[Z:%.*]]
 | |
| ; CHECK-NEXT:    ret i32* [[GEP]]
 | |
| ;
 | |
|   %vec_ptr = bitcast [3 x i32]* %x to <3 x i32>*
 | |
|   %gep = getelementptr inbounds <3 x i32>, <3 x i32>* %vec_ptr, i64 %y, i64 %z
 | |
|   ret i32* %gep
 | |
| }
 | |
| 
 | |
| ; Sizes and types match - safe to remove bitcast.
 | |
| 
 | |
| define i32* @bitcast_vec_to_array_gep_matching_alloc_size(<4 x i32>* %x, i64 %y, i64 %z) {
 | |
| ; CHECK-LABEL: @bitcast_vec_to_array_gep_matching_alloc_size(
 | |
| ; CHECK-NEXT:    [[GEP:%.*]] = getelementptr <4 x i32>, <4 x i32>* [[X:%.*]], i64 [[Y:%.*]], i64 [[Z:%.*]]
 | |
| ; CHECK-NEXT:    ret i32* [[GEP]]
 | |
| ;
 | |
|   %arr_ptr = bitcast <4 x i32>* %x to [4 x i32]*
 | |
|   %gep = getelementptr [4 x i32], [4 x i32]* %arr_ptr, i64 %y, i64 %z
 | |
|   ret i32* %gep
 | |
| }
 | |
| 
 | |
| ; Sizes and types match - safe to remove bitcast.
 | |
| 
 | |
| define i32* @bitcast_array_to_vec_gep_matching_alloc_size([4 x i32]* %x, i64 %y, i64 %z) {
 | |
| ; CHECK-LABEL: @bitcast_array_to_vec_gep_matching_alloc_size(
 | |
| ; CHECK-NEXT:    [[GEP:%.*]] = getelementptr inbounds [4 x i32], [4 x i32]* [[X:%.*]], i64 [[Y:%.*]], i64 [[Z:%.*]]
 | |
| ; CHECK-NEXT:    ret i32* [[GEP]]
 | |
| ;
 | |
|   %vec_ptr = bitcast [4 x i32]* %x to <4 x i32>*
 | |
|   %gep = getelementptr inbounds <4 x i32>, <4 x i32>* %vec_ptr, i64 %y, i64 %z
 | |
|   ret i32* %gep
 | |
| }
 | |
| 
 | |
| ; Negative test - datalayout's alloc size for the 2 types must match.
 | |
| 
 | |
| define i32 addrspace(3)* @bitcast_vec_to_array_addrspace(<7 x i32>* %x, i64 %y, i64 %z) {
 | |
| ; CHECK-LABEL: @bitcast_vec_to_array_addrspace(
 | |
| ; CHECK-NEXT:    [[ARR_PTR:%.*]] = bitcast <7 x i32>* [[X:%.*]] to [7 x i32]*
 | |
| ; CHECK-NEXT:    [[ASC:%.*]] = addrspacecast [7 x i32]* [[ARR_PTR]] to [7 x i32] addrspace(3)*
 | |
| ; CHECK-NEXT:    [[GEP:%.*]] = getelementptr [7 x i32], [7 x i32] addrspace(3)* [[ASC]], i64 [[Y:%.*]], i64 [[Z:%.*]]
 | |
| ; CHECK-NEXT:    ret i32 addrspace(3)* [[GEP]]
 | |
| ;
 | |
|   %arr_ptr = bitcast <7 x i32>* %x to [7 x i32]*
 | |
|   %asc = addrspacecast [7 x i32]* %arr_ptr to [7 x i32] addrspace(3)*
 | |
|   %gep = getelementptr [7 x i32], [7 x i32] addrspace(3)* %asc, i64 %y, i64 %z
 | |
|   ret i32 addrspace(3)* %gep
 | |
| }
 | |
| 
 | |
| ; Negative test - datalayout's alloc size for the 2 types must match.
 | |
| 
 | |
| define i32 addrspace(3)* @inbounds_bitcast_vec_to_array_addrspace(<7 x i32>* %x, i64 %y, i64 %z) {
 | |
| ; CHECK-LABEL: @inbounds_bitcast_vec_to_array_addrspace(
 | |
| ; CHECK-NEXT:    [[ARR_PTR:%.*]] = bitcast <7 x i32>* [[X:%.*]] to [7 x i32]*
 | |
| ; CHECK-NEXT:    [[ASC:%.*]] = addrspacecast [7 x i32]* [[ARR_PTR]] to [7 x i32] addrspace(3)*
 | |
| ; CHECK-NEXT:    [[GEP:%.*]] = getelementptr inbounds [7 x i32], [7 x i32] addrspace(3)* [[ASC]], i64 [[Y:%.*]], i64 [[Z:%.*]]
 | |
| ; CHECK-NEXT:    ret i32 addrspace(3)* [[GEP]]
 | |
| ;
 | |
|   %arr_ptr = bitcast <7 x i32>* %x to [7 x i32]*
 | |
|   %asc = addrspacecast [7 x i32]* %arr_ptr to [7 x i32] addrspace(3)*
 | |
|   %gep = getelementptr inbounds [7 x i32], [7 x i32] addrspace(3)* %asc, i64 %y, i64 %z
 | |
|   ret i32 addrspace(3)* %gep
 | |
| }
 | |
| 
 | |
| ; Sizes and types match - safe to remove bitcast.
 | |
| 
 | |
| define i32 addrspace(3)* @bitcast_vec_to_array_addrspace_matching_alloc_size(<4 x i32>* %x, i64 %y, i64 %z) {
 | |
| ; CHECK-LABEL: @bitcast_vec_to_array_addrspace_matching_alloc_size(
 | |
| ; CHECK-NEXT:    [[GEP:%.*]] = getelementptr <4 x i32>, <4 x i32>* [[X:%.*]], i64 [[Y:%.*]], i64 [[Z:%.*]]
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = addrspacecast i32* [[GEP]] to i32 addrspace(3)*
 | |
| ; CHECK-NEXT:    ret i32 addrspace(3)* [[TMP1]]
 | |
| ;
 | |
|   %arr_ptr = bitcast <4 x i32>* %x to [4 x i32]*
 | |
|   %asc = addrspacecast [4 x i32]* %arr_ptr to [4 x i32] addrspace(3)*
 | |
|   %gep = getelementptr [4 x i32], [4 x i32] addrspace(3)* %asc, i64 %y, i64 %z
 | |
|   ret i32 addrspace(3)* %gep
 | |
| }
 | |
| 
 | |
| ; Sizes and types match - safe to remove bitcast.
 | |
| 
 | |
| define i32 addrspace(3)* @inbounds_bitcast_vec_to_array_addrspace_matching_alloc_size(<4 x i32>* %x, i64 %y, i64 %z) {
 | |
| ; CHECK-LABEL: @inbounds_bitcast_vec_to_array_addrspace_matching_alloc_size(
 | |
| ; CHECK-NEXT:    [[GEP:%.*]] = getelementptr inbounds <4 x i32>, <4 x i32>* [[X:%.*]], i64 [[Y:%.*]], i64 [[Z:%.*]]
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = addrspacecast i32* [[GEP]] to i32 addrspace(3)*
 | |
| ; CHECK-NEXT:    ret i32 addrspace(3)* [[TMP1]]
 | |
| ;
 | |
|   %arr_ptr = bitcast <4 x i32>* %x to [4 x i32]*
 | |
|   %asc = addrspacecast [4 x i32]* %arr_ptr to [4 x i32] addrspace(3)*
 | |
|   %gep = getelementptr inbounds [4 x i32], [4 x i32] addrspace(3)* %asc, i64 %y, i64 %z
 | |
|   ret i32 addrspace(3)* %gep
 | |
| }
 | |
| 
 | |
| ; Negative test - avoid doing bitcast on i8*, because '16' should be scaled by 'vscale'.
 | |
| 
 | |
| define i8* @test_accumulate_constant_offset_vscale_nonzero(<vscale x 16 x i1> %pg, i8* %base) {
 | |
| ; CHECK-LABEL: @test_accumulate_constant_offset_vscale_nonzero
 | |
| ; CHECK-NEXT:   %bc = bitcast i8* %base to <vscale x 16 x i8>*
 | |
| ; CHECK-NEXT:   %gep = getelementptr <vscale x 16 x i8>, <vscale x 16 x i8>* %bc, i64 1, i64 4
 | |
| ; CHECK-NEXT:   ret i8* %gep
 | |
|   %bc = bitcast i8* %base to <vscale x 16 x i8>*
 | |
|   %gep = getelementptr <vscale x 16 x i8>, <vscale x 16 x i8>* %bc, i64 1, i64 4
 | |
|   ret i8* %gep
 | |
| }
 | |
| 
 | |
| define i8* @test_accumulate_constant_offset_vscale_zero(<vscale x 16 x i1> %pg, i8* %base) {
 | |
| ; CHECK-LABEL: @test_accumulate_constant_offset_vscale_zero
 | |
| ; CHECK-NEXT:   %[[RES:.*]] = getelementptr i8, i8* %base, i64 4
 | |
| ; CHECK-NEXT:   ret i8* %[[RES]]
 | |
|   %bc = bitcast i8* %base to <vscale x 16 x i8>*
 | |
|   %gep = getelementptr <vscale x 16 x i8>, <vscale x 16 x i8>* %bc, i64 0, i64 4
 | |
|   ret i8* %gep
 | |
| }
 |