79 lines
		
	
	
		
			2.2 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			79 lines
		
	
	
		
			2.2 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; RUN: opt -basicaa -loop-vectorize -force-vector-width=2 \
 | |
| ; RUN:     -force-vector-interleave=1 -S < %s \
 | |
| ; RUN:     | FileCheck %s -check-prefix=BOTH -check-prefix=LV
 | |
| ; RUN: opt -basicaa -scoped-noalias -loop-vectorize -dse -force-vector-width=2 \
 | |
| ; RUN:     -force-vector-interleave=1 -S < %s \
 | |
| ; RUN:     | FileCheck %s -check-prefix=BOTH -check-prefix=DSE
 | |
| 
 | |
| target datalayout = "e-m:o-i64:64-f80:128-n8:16:32:64-S128" ; little-endian, Mach-O mangling, i64 aligned to 64 bits, f80 to 128 bits, native integer widths 8/16/32/64, 128-bit stack alignment
 | |
| 
 | |
| ; This loop needs to be versioned with memchecks between {A, B} x {C} before
 | |
| ; it can be vectorized.
 | |
| ;
 | |
| ;   for (i = 0; i < 20; i++) {
 | |
| ;     C[i] = A[i] + 2;
 | |
| ;     C[i] += B[i];
 | |
| ;   }
 | |
| ;
 | |
| ; Check that the corresponding noalias metadata is added to the vector loop
 | |
| ; but not to the scalar loop.
 | |
| ;
 | |
| ; Since in the versioned vector loop C and B can no longer alias, the first
 | |
| ; store to C[i] can be DSE'd.
 | |
| 
 | |
| 
 | |
| ; Loop under test. Each iteration loads element %ind of %a and of %b and
 | |
| ; stores to element %ind of %c twice; the loop exits once %inc reaches 20.
 | |
| define void @f(i32* %a, i32* %b, i32* %c) {
 | |
| entry:
 | |
|   br label %for.body
 | |
| 
 | |
| ; The transformed function is expected to contain a runtime memcheck block
 | |
| ; followed by a vector body.
 | |
| ; BOTH: vector.memcheck:
 | |
| ; BOTH: vector.body:
 | |
| for.body:                                         ; preds = %for.body, %entry
 | |
|   %ind = phi i64 [ 0, %entry ], [ %inc, %for.body ]
 | |
| 
 | |
|   %arrayidxA = getelementptr inbounds i32, i32* %a, i64 %ind
 | |
| ; Scope 1
 | |
| ; LV: = load {{.*}} !alias.scope !0
 | |
|   %loadA = load i32, i32* %arrayidxA, align 4
 | |
| 
 | |
|   %add = add nuw i32 %loadA, 2
 | |
| 
 | |
|   %arrayidxC = getelementptr inbounds i32, i32* %c, i64 %ind
 | |
| ; Noalias with scope 1 and 6
 | |
| ; LV: store {{.*}} !alias.scope !3, !noalias !5
 | |
| ; DSE-NOT: store
 | |
|   store i32 %add, i32* %arrayidxC, align 4
 | |
| 
 | |
|   %arrayidxB = getelementptr inbounds i32, i32* %b, i64 %ind
 | |
| ; Scope 6
 | |
| ; LV: = load {{.*}} !alias.scope !7
 | |
|   %loadB = load i32, i32* %arrayidxB, align 4
 | |
| 
 | |
|   %add2 = add nuw i32 %add, %loadB
 | |
| 
 | |
| ; Noalias with scope 1 and 6
 | |
| ; LV: store {{.*}} !alias.scope !3, !noalias !5
 | |
| ; DSE: store
 | |
|   store i32 %add2, i32* %arrayidxC, align 4
 | |
| ; The positive store match above always binds to the first store that follows
 | |
| ; the vector body label, so the negative check placed before it can never
 | |
| ; fire. Requiring that no further store shows up before the scalar loop label
 | |
| ; is what actually catches a first store that was not eliminated.
 | |
| ; DSE-NOT: store
 | |
| 
 | |
|   %inc = add nuw nsw i64 %ind, 1
 | |
|   %exitcond = icmp eq i64 %inc, 20
 | |
|   br i1 %exitcond, label %for.end, label %for.body
 | |
| 
 | |
| ; From the scalar loop label onwards no scoped-alias metadata attachments may
 | |
| ; appear.
 | |
| ; BOTH: for.body:
 | |
| ; BOTH-NOT: !alias.scope
 | |
| ; BOTH-NOT: !noalias
 | |
| 
 | |
| for.end:                                          ; preds = %for.body
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| ; LV: !0 = !{!1}
 | |
| ; LV: !1 = distinct !{!1, !2}
 | |
| ; LV: !2 = distinct !{!2, !"LVerDomain"}
 | |
| ; LV: !3 = !{!4}
 | |
| ; LV: !4 = distinct !{!4, !2}
 | |
| ; LV: !5 = !{!1, !6}
 | |
| ; LV: !6 = distinct !{!6, !2}
 | |
| ; LV: !7 = !{!6}
 |