43 lines
		
	
	
		
			1.5 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			43 lines
		
	
	
		
			1.5 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; RUN: opt -passes='loop-vectorize' -force-vector-width=2 -S < %s | FileCheck %s
 | |
| ;
 | |
| ; Forcing VF=2 to trigger vector code gen
 | |
| ;
 | |
| ; This is a test case that lets the vectorizer's code gen generate
 | |
| ; more than one BasicBlock in the loop body (emulated masked scatter)
 | |
| ; for those targets that do not support masked scatter. Broadcast
 | |
| ; code generation was previously dependent on the loop body being
 | |
| ; a single basic block and this test case exposed incorrect code gen
 | |
| ; resulting in an assert in IL verification. Test passes if IL verification
 | |
| ; does not fail.
 | |
| ;
 | |
| ; Performing minimal check in the output to ensure the loop is actually
 | |
| ; vectorized.
 | |
| ;
 | |
| ; CHECK: vector.body
 | |
| 
 | |
| @a = external global [2 x i16], align 1
 | |
| 
 | |
| define void @f1() { ; Loop whose body spans several basic blocks and stores into @a at an index derived from the loop counter.
 | |
| entry:
 | |
|   br label %for.body
 | |
| 
 | |
| for.body:                                         ; preds = %land.end, %entry
 | |
|   %0 = phi i32 [ undef, %entry ], [ %dec, %land.end ] ; loop counter: undef on entry, %dec when coming from the latch
 | |
|   br i1 undef, label %land.end, label %land.rhs ; undef condition: go straight to %land.end or pass through %land.rhs first
 | |
| 
 | |
| land.rhs:                                         ; preds = %for.body
 | |
|   %1 = load i32, i32* undef, align 1 ; the loaded value %1 has no uses in this function
 | |
|   br label %land.end
 | |
| 
 | |
| land.end:                                         ; preds = %land.rhs, %for.body
 | |
|   %2 = trunc i32 %0 to i16 ; narrow the counter to i16 so it can be used as the array index
 | |
|   %arrayidx = getelementptr inbounds [2 x i16], [2 x i16]* @a, i16 0, i16 %2 ; address of element %2 of @a
 | |
|   store i16 undef, i16* %arrayidx, align 1 ; write an undef i16 to that element
 | |
|   %dec = add nsw i32 %0, -1 ; counter for the next iteration (counts down by one)
 | |
|   %cmp = icmp sgt i32 %0, 1 ; compares the pre-decrement counter %0, not %dec
 | |
|   br i1 %cmp, label %for.body, label %for.cond.for.end_crit_edge ; back edge while %0 > 1, otherwise leave the loop
 | |
| 
 | |
| for.cond.for.end_crit_edge:                       ; preds = %land.end
 | |
|   unreachable ; the loop exit block ends in unreachable; the function has no ret
 | |
| }
 |