7121 lines
		
	
	
		
			477 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			7121 lines
		
	
	
		
			477 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --function-signature --include-generated-funcs
 | |
| ; RUN: opt -S -attributor -openmp-opt-cgscc -openmp-opt-enable-merging -enable-new-pm=0 < %s | FileCheck %s --check-prefix=CHECK1
 | |
| ; RUN: opt -S -aa-pipeline= -passes='attributor,cgscc(openmp-opt-cgscc)' -openmp-opt-enable-merging  < %s | FileCheck %s --check-prefix=CHECK2
 | |
| ; #include <omp.h>
 | |
| ; void foo();
 | |
| ; void use(int);
 | |
| ; void usef(float);
 | |
| ; void merge(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; }
 | |
| ; void unmergable_proc_bind(int a) {
 | |
| ; #pragma omp parallel proc_bind(close)
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; }
 | |
| ; void unmergable_num_threads(int a) {
 | |
| ; #pragma omp parallel num_threads(a)
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; }
 | |
| ; void unmergable_seq_call(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     foo();
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; }
 | |
| ; void merge_seq(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     a = a + 1;
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     use(a);
 | |
| ; }
 | |
| ; void merge_seq_float(float f, float *p) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(f);
 | |
| ;     }
 | |
| ;     *p = f + 3.14f;
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(f);
 | |
| ;     }
 | |
| ; }
 | |
| ; void merge_seq_firstprivate(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     a = a + 1;
 | |
| ; #pragma omp parallel firstprivate(a)
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     use(a);
 | |
| ; }
 | |
| ; void merge_seq_sink_lt(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     {
 | |
| ;         int b = (int)&b;
 | |
| ;     }
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; }
 | |
| ; void merge_seq_par_use(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     int b = a + 1;
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;         use(b);
 | |
| ;     }
 | |
| ; }
 | |
| ; void merge_cancellable_regions(int cancel1, int cancel2)
 | |
| ; {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         if(cancel1) {
 | |
| ; #pragma omp cancel parallel
 | |
| ;         }
 | |
| ;     }
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         if (cancel2) {
 | |
| ; #pragma omp cancel parallel
 | |
| ;         }
 | |
| ;     }
 | |
| ; }
 | |
| ; void merge_cancellable_regions_seq(int cancel1, int cancel2)
 | |
| ; {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         if(cancel1) {
 | |
| ; #pragma omp cancel parallel
 | |
| ;         }
 | |
| ;     }
 | |
| ;     cancel2 = !cancel1;
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         if (cancel2) {
 | |
| ; #pragma omp cancel parallel
 | |
| ;         }
 | |
| ;     }
 | |
| ; }
 | |
| ; void merge_3(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; }
 | |
| ; void merge_3_seq(int a, int b) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     b = a + 1;
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     b = b + a;
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     use(b);
 | |
| ; }
 | |
| ; void unmergable_3_seq_call(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     foo();
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     foo();
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; }
 | |
| ; void unmergable_3_proc_bind(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; #pragma omp parallel proc_bind(close)
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; }
 | |
| ; void unmergable_3_num_threads(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; #pragma omp parallel num_threads(a)
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; }
 | |
| ; void merge_2_unmergable_1(int a) {
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ;     foo();
 | |
| ; #pragma omp parallel
 | |
| ;     {
 | |
| ;         use(a);
 | |
| ;     }
 | |
| ; }
 | |
| target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
 | |
| 
 | |
| %struct.ident_t = type { i32, i32, i32, i32, i8* }
 | |
| 
 | |
| @0 = private unnamed_addr constant [23 x i8] c";unknown;unknown;0;0;;\00", align 1
 | |
| @1 = private unnamed_addr constant %struct.ident_t { i32 0, i32 2, i32 0, i32 0, i8* getelementptr inbounds ([23 x i8], [23 x i8]* @0, i32 0, i32 0) }, align 8
 | |
| 
 | |
| define dso_local void @merge(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined. to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..1 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined.(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| declare dso_local void @use(i32) local_unnamed_addr
 | |
| 
 | |
| declare !callback !1 void @__kmpc_fork_call(%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) local_unnamed_addr
 | |
| 
 | |
| define internal void @.omp_outlined..1(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @unmergable_proc_bind(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   %0 = call i32 @__kmpc_global_thread_num(%struct.ident_t* nonnull @1)
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void @__kmpc_push_proc_bind(%struct.ident_t* nonnull @1, i32 %0, i32 3)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..2(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| declare i32 @__kmpc_global_thread_num(%struct.ident_t*) local_unnamed_addr
 | |
| 
 | |
| declare void @__kmpc_push_proc_bind(%struct.ident_t*, i32, i32) local_unnamed_addr
 | |
| 
 | |
| define internal void @.omp_outlined..3(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @unmergable_num_threads(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   %0 = call i32 @__kmpc_global_thread_num(%struct.ident_t* nonnull @1)
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void @__kmpc_push_num_threads(%struct.ident_t* nonnull @1, i32 %0, i32 %a)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..4 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..5 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..4(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| declare void @__kmpc_push_num_threads(%struct.ident_t*, i32, i32) local_unnamed_addr
 | |
| 
 | |
| define internal void @.omp_outlined..5(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @unmergable_seq_call(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (...) @foo()
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..6(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| declare dso_local void @foo(...) local_unnamed_addr
 | |
| 
 | |
| define internal void @.omp_outlined..7(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @merge_seq(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..8 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   %0 = load i32, i32* %a.addr, align 4
 | |
|   %add = add nsw i32 %0, 1
 | |
|   store i32 %add, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..9 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   %1 = load i32, i32* %a.addr, align 4
 | |
|   call void @use(i32 %1)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..8(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..9(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @merge_seq_float(float %f, float* nocapture %p) local_unnamed_addr  {
 | |
| entry:
 | |
|   %f.addr = alloca float, align 4
 | |
|   store float %f, float* %f.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, float*)* @.omp_outlined..10 to void (i32*, i32*, ...)*), float* nonnull %f.addr)
 | |
|   %0 = load float, float* %f.addr, align 4
 | |
|   %add = fadd float %0, 0x40091EB860000000
 | |
|   store float %add, float* %p, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, float*)* @.omp_outlined..11 to void (i32*, i32*, ...)*), float* nonnull %f.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..10(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., float* nocapture nonnull readonly align 4 dereferenceable(4) %f)  {
 | |
| entry:
 | |
|   %0 = load float, float* %f, align 4
 | |
|   %conv = fptosi float %0 to i32
 | |
|   call void @use(i32 %conv)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..11(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., float* nocapture nonnull readonly align 4 dereferenceable(4) %f)  {
 | |
| entry:
 | |
|   %0 = load float, float* %f, align 4
 | |
|   %conv = fptosi float %0 to i32
 | |
|   call void @use(i32 %conv)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @merge_seq_firstprivate(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..12 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   %0 = load i32, i32* %a.addr, align 4
 | |
|   %add = add nsw i32 %0, 1
 | |
|   store i32 %add, i32* %a.addr, align 4
 | |
|   %a.casted.sroa.0.0.insert.ext = zext i32 %add to i64
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i64)* @.omp_outlined..13 to void (i32*, i32*, ...)*), i64 %a.casted.sroa.0.0.insert.ext)
 | |
|   %1 = load i32, i32* %a.addr, align 4
 | |
|   call void @use(i32 %1)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..12(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..13(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i64 %a)  {
 | |
| entry:
 | |
|   %a.addr.sroa.0.0.extract.trunc = trunc i64 %a to i32
 | |
|   call void @use(i32 %a.addr.sroa.0.0.extract.trunc)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @merge_seq_sink_lt(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   %b = alloca i32, align 4
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..14 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   %0 = bitcast i32* %b to i8*
 | |
|   call void @llvm.lifetime.start.p0i8(i64 4, i8* nonnull %0)
 | |
|   %1 = ptrtoint i32* %b to i64
 | |
|   %2 = trunc i64 %1 to i32
 | |
|   store i32 %2, i32* %b, align 4
 | |
|   call void @llvm.lifetime.end.p0i8(i64 4, i8* nonnull %0)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..15 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..14(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| declare void @llvm.lifetime.start.p0i8(i64 immarg, i8* nocapture)
 | |
| 
 | |
| declare void @llvm.lifetime.end.p0i8(i64 immarg, i8* nocapture)
 | |
| 
 | |
| define internal void @.omp_outlined..15(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @merge_seq_par_use(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   %b = alloca i32, align 4
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..16 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   %0 = bitcast i32* %b to i8*
 | |
|   call void @llvm.lifetime.start.p0i8(i64 4, i8* nonnull %0)
 | |
|   %1 = load i32, i32* %a.addr, align 4
 | |
|   %add = add nsw i32 %1, 1
 | |
|   store i32 %add, i32* %b, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @.omp_outlined..17 to void (i32*, i32*, ...)*), i32* nonnull %a.addr, i32* nonnull %b)
 | |
|   call void @llvm.lifetime.end.p0i8(i64 4, i8* nonnull %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..16(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..17(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a, i32* nocapture nonnull readonly align 4 dereferenceable(4) %b)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   %1 = load i32, i32* %b, align 4
 | |
|   call void @use(i32 %1)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @merge_cancellable_regions(i32 %cancel1, i32 %cancel2) local_unnamed_addr  {
 | |
| entry:
 | |
|   %cancel1.addr = alloca i32, align 4
 | |
|   %cancel2.addr = alloca i32, align 4
 | |
|   store i32 %cancel1, i32* %cancel1.addr, align 4
 | |
|   store i32 %cancel2, i32* %cancel2.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..18 to void (i32*, i32*, ...)*), i32* nonnull %cancel1.addr)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..19 to void (i32*, i32*, ...)*), i32* nonnull %cancel2.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..18(i32* noalias nocapture readonly %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %cancel1)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %cancel1, align 4
 | |
|   %tobool.not = icmp eq i32 %0, 0
 | |
|   br i1 %tobool.not, label %if.end, label %if.then
 | |
| 
 | |
| if.then:                                          ; preds = %entry
 | |
|   %1 = load i32, i32* %.global_tid., align 4
 | |
|   %2 = call i32 @__kmpc_cancel(%struct.ident_t* nonnull @1, i32 %1, i32 1)
 | |
|   ret void
 | |
| 
 | |
| if.end:                                           ; preds = %entry
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| declare i32 @__kmpc_cancel(%struct.ident_t*, i32, i32) local_unnamed_addr
 | |
| 
 | |
| define internal void @.omp_outlined..19(i32* noalias nocapture readonly %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %cancel2)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %cancel2, align 4
 | |
|   %tobool.not = icmp eq i32 %0, 0
 | |
|   br i1 %tobool.not, label %if.end, label %if.then
 | |
| 
 | |
| if.then:                                          ; preds = %entry
 | |
|   %1 = load i32, i32* %.global_tid., align 4
 | |
|   %2 = call i32 @__kmpc_cancel(%struct.ident_t* nonnull @1, i32 %1, i32 1)
 | |
|   ret void
 | |
| 
 | |
| if.end:                                           ; preds = %entry
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @merge_cancellable_regions_seq(i32 %cancel1, i32 %cancel2) local_unnamed_addr  {
 | |
| entry:
 | |
|   %cancel1.addr = alloca i32, align 4
 | |
|   %cancel2.addr = alloca i32, align 4
 | |
|   store i32 %cancel1, i32* %cancel1.addr, align 4
 | |
|   store i32 %cancel2, i32* %cancel2.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..20 to void (i32*, i32*, ...)*), i32* nonnull %cancel1.addr)
 | |
|   %0 = load i32, i32* %cancel1.addr, align 4
 | |
|   %tobool.not = icmp eq i32 %0, 0
 | |
|   %lnot.ext = zext i1 %tobool.not to i32
 | |
|   store i32 %lnot.ext, i32* %cancel2.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..21 to void (i32*, i32*, ...)*), i32* nonnull %cancel2.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..20(i32* noalias nocapture readonly %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %cancel1)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %cancel1, align 4
 | |
|   %tobool.not = icmp eq i32 %0, 0
 | |
|   br i1 %tobool.not, label %if.end, label %if.then
 | |
| 
 | |
| if.then:                                          ; preds = %entry
 | |
|   %1 = load i32, i32* %.global_tid., align 4
 | |
|   %2 = call i32 @__kmpc_cancel(%struct.ident_t* nonnull @1, i32 %1, i32 1)
 | |
|   ret void
 | |
| 
 | |
| if.end:                                           ; preds = %entry
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..21(i32* noalias nocapture readonly %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %cancel2)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %cancel2, align 4
 | |
|   %tobool.not = icmp eq i32 %0, 0
 | |
|   br i1 %tobool.not, label %if.end, label %if.then
 | |
| 
 | |
| if.then:                                          ; preds = %entry
 | |
|   %1 = load i32, i32* %.global_tid., align 4
 | |
|   %2 = call i32 @__kmpc_cancel(%struct.ident_t* nonnull @1, i32 %1, i32 1)
 | |
|   ret void
 | |
| 
 | |
| if.end:                                           ; preds = %entry
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @merge_3(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..22 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..23 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..24 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..22(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..23(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..24(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @merge_3_seq(i32 %a, i32 %b) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..25 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   %0 = load i32, i32* %a.addr, align 4
 | |
|   %add = add nsw i32 %0, 1
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..26 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   %1 = load i32, i32* %a.addr, align 4
 | |
|   %add1 = add nsw i32 %add, %1
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..27 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void @use(i32 %add1)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..25(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..26(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..27(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @unmergable_3_seq_call(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..28 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (...) @foo()
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..29 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (...) @foo()
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..28(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..29(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..30(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @unmergable_3_proc_bind(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   %0 = call i32 @__kmpc_global_thread_num(%struct.ident_t* nonnull @1)
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void @__kmpc_push_proc_bind(%struct.ident_t* nonnull @1, i32 %0, i32 3)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..32 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..33 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..31(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..32(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..33(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @unmergable_3_num_threads(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   %0 = call i32 @__kmpc_global_thread_num(%struct.ident_t* nonnull @1)
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   %1 = load i32, i32* %a.addr, align 4
 | |
|   call void @__kmpc_push_num_threads(%struct.ident_t* nonnull @1, i32 %0, i32 %1)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..36 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..34(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..35(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..36(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define dso_local void @merge_2_unmergable_1(i32 %a) local_unnamed_addr  {
 | |
| entry:
 | |
|   %a.addr = alloca i32, align 4
 | |
|   store i32 %a, i32* %a.addr, align 4
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..37 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..38 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   call void (...) @foo()
 | |
|   call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i32* nonnull %a.addr)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..37(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..38(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| define internal void @.omp_outlined..39(i32* noalias nocapture readnone %.global_tid., i32* noalias nocapture readnone %.bound_tid., i32* nocapture nonnull readonly align 4 dereferenceable(4) %a)  {
 | |
| entry:
 | |
|   %0 = load i32, i32* %a, align 4
 | |
|   call void @use(i32 %0)
 | |
|   ret void
 | |
| }
 | |
| 
 | |
| 
 | |
| !llvm.module.flags = !{!0, !3}
 | |
| 
 | |
| !0 = !{i32 1, !"wchar_size", i32 4}
 | |
| !1 = !{!2}
 | |
| !2 = !{i64 2, i64 -1, i64 -1, i1 true}
 | |
| !3 = !{i32 7, !"openmp", i32 50}
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1:[0-9]+]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0:[0-9]+]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined.(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2:[0-9]+]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..1(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined.
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..1
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_proc_bind
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..2
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..3
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_num_threads
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[A]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..4 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..5 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..4
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..5
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_seq_call
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..6
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..7
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_seq..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..8(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..9(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP3]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..8
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..9
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_float
 | |
| ; CHECK-SAME: (float [[F:%.*]], float* nocapture nofree writeonly [[P:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[F_ADDR:%.*]] = alloca float, align 4
 | |
| ; CHECK-NEXT:    store float [[F]], float* [[F_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, float*, float*)* @merge_seq_float..omp_par to void (i32*, i32*, ...)*), float* [[F_ADDR]], float* [[P]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_float..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], float* [[F_ADDR:%.*]], float* [[P:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..10(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..11(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load float, float* [[F_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = fadd float [[TMP3]], 0x40091EB860000000
 | |
| ; CHECK-NEXT:    store float [[ADD]], float* [[P]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..10
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..11
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_firstprivate
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = alloca i64, align 8
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i64*)* @merge_seq_firstprivate..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_firstprivate..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..12(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD:%.*]] = load i64, i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..13(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i64 [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP3]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT:%.*]] = zext i32 [[ADD]] to i64
 | |
| ; CHECK-NEXT:    store i64 [[A_CASTED_SROA_0_0_INSERT_EXT]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..12
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..13
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i64 [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR_SROA_0_0_EXTRACT_TRUNC:%.*]] = trunc i64 [[A]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[A_ADDR_SROA_0_0_EXTRACT_TRUNC]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_sink_lt
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_seq_sink_lt..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_sink_lt..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..14(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..15(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.start.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP3]])
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = ptrtoint i32* [[B]] to i64
 | |
| ; CHECK-NEXT:    [[TMP5:%.*]] = trunc i64 [[TMP4]] to i32
 | |
| ; CHECK-NEXT:    store i32 [[TMP5]], i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP3]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..14
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..15
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_par_use
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    [[LT_CAST3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.start.p0i8(i64 -1, i8* [[LT_CAST3]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_seq_par_use..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i32* [[B]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[LT_CAST:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[LT_CAST]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_par_use..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i32* [[B:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..16(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..17(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[B]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP4]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..16
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..17
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[B:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP1]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions
 | |
| ; CHECK-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_cancellable_regions..omp_par to void (i32*, i32*, ...)*), i32* [[CANCEL1_ADDR]], i32* [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[CANCEL1_ADDR:%.*]], i32* [[CANCEL2_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..18(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..19(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..18
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..19
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq
 | |
| ; CHECK-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_cancellable_regions_seq..omp_par to void (i32*, i32*, ...)*), i32* [[CANCEL1_ADDR]], i32* [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[CANCEL1_ADDR:%.*]], i32* [[CANCEL2_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..20(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..21(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP3]], 0
 | |
| ; CHECK-NEXT:    [[LNOT_EXT:%.*]] = zext i1 [[TOBOOL_NOT]] to i32
 | |
| ; CHECK-NEXT:    store i32 [[LNOT_EXT]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..20
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..21
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_3..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..22(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..23(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..24(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..22
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..23
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..24
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3_seq
 | |
| ; CHECK-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[ADD1_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[ADD_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM7:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 3, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32*)* @merge_3_seq..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i32* [[ADD_SEQ_OUTPUT_ALLOC]], i32* [[ADD1_SEQ_OUTPUT_ALLOC]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[ADD1_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[ADD1_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i32* [[ADD_SEQ_OUTPUT_ALLOC:%.*]], i32* [[ADD1_SEQ_OUTPUT_ALLOC:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..25(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..26(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM4:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM4]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM3:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY5:%.*]], label [[OMP_REGION_END4:%.*]]
 | |
| ; CHECK:       omp_region.end4:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM6:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM6]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..27(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body5:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED2:%.*]]
 | |
| ; CHECK:       seq.par.merged2:
 | |
| ; CHECK-NEXT:    [[TMP5:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    [[ADD1:%.*]] = add nsw i32 [[ADD_SEQ_OUTPUT_LOAD]], [[TMP5]]
 | |
| ; CHECK-NEXT:    store i32 [[ADD1]], i32* [[ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY5_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body5.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END4]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP6:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP6]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..25
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..26
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..27
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_seq_call
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..28 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..29 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..28
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..29
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..30
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_proc_bind
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..32 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..33 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..31
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..32
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..33
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_num_threads
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[TMP1]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..36 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..34
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..35
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..36
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_2_unmergable_1
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_2_unmergable_1..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_2_unmergable_1..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..37(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..38(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..37
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..38
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..39
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined.(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..1(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined.
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..1
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_proc_bind
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..2
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..3
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_num_threads
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[A]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..4 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..5 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..4
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..5
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_seq_call
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..6
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..7
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_seq..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..8(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..9(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP3]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..8
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..9
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_float
 | |
| ; CHECK-SAME: (float [[F:%.*]], float* nocapture nofree writeonly [[P:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[F_ADDR:%.*]] = alloca float, align 4
 | |
| ; CHECK-NEXT:    store float [[F]], float* [[F_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, float*, float*)* @merge_seq_float..omp_par to void (i32*, i32*, ...)*), float* [[F_ADDR]], float* [[P]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_float..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], float* [[F_ADDR:%.*]], float* [[P:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..10(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..11(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load float, float* [[F_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = fadd float [[TMP3]], 0x40091EB860000000
 | |
| ; CHECK-NEXT:    store float [[ADD]], float* [[P]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..10
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..11
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_firstprivate
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = alloca i64, align 8
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i64*)* @merge_seq_firstprivate..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_firstprivate..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..12(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD:%.*]] = load i64, i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..13(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i64 [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP3]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT:%.*]] = zext i32 [[ADD]] to i64
 | |
| ; CHECK-NEXT:    store i64 [[A_CASTED_SROA_0_0_INSERT_EXT]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..12
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..13
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i64 [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR_SROA_0_0_EXTRACT_TRUNC:%.*]] = trunc i64 [[A]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[A_ADDR_SROA_0_0_EXTRACT_TRUNC]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_sink_lt
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_seq_sink_lt..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_sink_lt..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..14(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..15(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.start.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP3]])
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = ptrtoint i32* [[B]] to i64
 | |
| ; CHECK-NEXT:    [[TMP5:%.*]] = trunc i64 [[TMP4]] to i32
 | |
| ; CHECK-NEXT:    store i32 [[TMP5]], i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP3]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..14
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..15
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_par_use
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    [[LT_CAST3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.start.p0i8(i64 -1, i8* [[LT_CAST3]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_seq_par_use..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i32* [[B]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[LT_CAST:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[LT_CAST]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_par_use..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i32* [[B:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..16(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..17(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[B]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP4]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..16
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..17
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[B:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP1]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions
 | |
| ; CHECK-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_cancellable_regions..omp_par to void (i32*, i32*, ...)*), i32* [[CANCEL1_ADDR]], i32* [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[CANCEL1_ADDR:%.*]], i32* [[CANCEL2_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..18(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..19(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..18
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..19
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq
 | |
| ; CHECK-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_cancellable_regions_seq..omp_par to void (i32*, i32*, ...)*), i32* [[CANCEL1_ADDR]], i32* [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[CANCEL1_ADDR:%.*]], i32* [[CANCEL2_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..20(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..21(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP3]], 0
 | |
| ; CHECK-NEXT:    [[LNOT_EXT:%.*]] = zext i1 [[TOBOOL_NOT]] to i32
 | |
| ; CHECK-NEXT:    store i32 [[LNOT_EXT]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..20
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..21
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_3..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..22(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..23(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..24(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..22
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..23
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..24
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3_seq
 | |
| ; CHECK-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[ADD1_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[ADD_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM7:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 3, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32*)* @merge_3_seq..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i32* [[ADD_SEQ_OUTPUT_ALLOC]], i32* [[ADD1_SEQ_OUTPUT_ALLOC]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[ADD1_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[ADD1_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i32* [[ADD_SEQ_OUTPUT_ALLOC:%.*]], i32* [[ADD1_SEQ_OUTPUT_ALLOC:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..25(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..26(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM4:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM4]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM3:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY5:%.*]], label [[OMP_REGION_END4:%.*]]
 | |
| ; CHECK:       omp_region.end4:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM6:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM6]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..27(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body5:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED2:%.*]]
 | |
| ; CHECK:       seq.par.merged2:
 | |
| ; CHECK-NEXT:    [[TMP5:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    [[ADD1:%.*]] = add nsw i32 [[ADD_SEQ_OUTPUT_LOAD]], [[TMP5]]
 | |
| ; CHECK-NEXT:    store i32 [[ADD1]], i32* [[ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY5_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body5.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END4]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP6:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP6]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..25
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..26
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..27
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_seq_call
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..28 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..29 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..28
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..29
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..30
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_proc_bind
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..32 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..33 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..31
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..32
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..33
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_num_threads
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[TMP1]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..36 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..34
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..35
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..36
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_2_unmergable_1
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_2_unmergable_1..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_2_unmergable_1..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..37(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..38(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..37
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..38
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..39
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined.(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..1(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined.
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..1
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_proc_bind
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..2
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..3
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_num_threads
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[A]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..4 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..5 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..4
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..5
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_seq_call
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..6
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..7
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_seq..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..8(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..9(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP3]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..8
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..9
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_float
 | |
| ; CHECK-SAME: (float [[F:%.*]], float* nocapture nofree writeonly [[P:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[F_ADDR:%.*]] = alloca float, align 4
 | |
| ; CHECK-NEXT:    store float [[F]], float* [[F_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, float*, float*)* @merge_seq_float..omp_par to void (i32*, i32*, ...)*), float* [[F_ADDR]], float* [[P]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_float..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], float* [[F_ADDR:%.*]], float* [[P:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..10(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..11(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load float, float* [[F_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = fadd float [[TMP3]], 0x40091EB860000000
 | |
| ; CHECK-NEXT:    store float [[ADD]], float* [[P]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..10
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..11
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_firstprivate
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = alloca i64, align 8
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i64*)* @merge_seq_firstprivate..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_firstprivate..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..12(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD:%.*]] = load i64, i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..13(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i64 [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP3]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT:%.*]] = zext i32 [[ADD]] to i64
 | |
| ; CHECK-NEXT:    store i64 [[A_CASTED_SROA_0_0_INSERT_EXT]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..12
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..13
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i64 [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR_SROA_0_0_EXTRACT_TRUNC:%.*]] = trunc i64 [[A]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[A_ADDR_SROA_0_0_EXTRACT_TRUNC]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_sink_lt
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_seq_sink_lt..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_sink_lt..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..14(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..15(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.start.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP3]])
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = ptrtoint i32* [[B]] to i64
 | |
| ; CHECK-NEXT:    [[TMP5:%.*]] = trunc i64 [[TMP4]] to i32
 | |
| ; CHECK-NEXT:    store i32 [[TMP5]], i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP3]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..14
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..15
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_par_use
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    [[LT_CAST3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.start.p0i8(i64 -1, i8* [[LT_CAST3]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_seq_par_use..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i32* [[B]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[LT_CAST:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[LT_CAST]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_par_use..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i32* [[B:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..16(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..17(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[B]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP4]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..16
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..17
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[B:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP1]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions
 | |
| ; CHECK-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_cancellable_regions..omp_par to void (i32*, i32*, ...)*), i32* [[CANCEL1_ADDR]], i32* [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[CANCEL1_ADDR:%.*]], i32* [[CANCEL2_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..18(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..19(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..18
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..19
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq
 | |
| ; CHECK-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_cancellable_regions_seq..omp_par to void (i32*, i32*, ...)*), i32* [[CANCEL1_ADDR]], i32* [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[CANCEL1_ADDR:%.*]], i32* [[CANCEL2_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..20(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..21(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP3]], 0
 | |
| ; CHECK-NEXT:    [[LNOT_EXT:%.*]] = zext i1 [[TOBOOL_NOT]] to i32
 | |
| ; CHECK-NEXT:    store i32 [[LNOT_EXT]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..20
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..21
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_3..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..22(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..23(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..24(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..22
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..23
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..24
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3_seq
 | |
| ; CHECK-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[ADD1_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[ADD_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM7:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 3, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32*)* @merge_3_seq..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i32* [[ADD_SEQ_OUTPUT_ALLOC]], i32* [[ADD1_SEQ_OUTPUT_ALLOC]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[ADD1_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[ADD1_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i32* [[ADD_SEQ_OUTPUT_ALLOC:%.*]], i32* [[ADD1_SEQ_OUTPUT_ALLOC:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..25(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..26(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM4:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM4]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM3:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY5:%.*]], label [[OMP_REGION_END4:%.*]]
 | |
| ; CHECK:       omp_region.end4:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM6:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM6]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..27(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body5:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED2:%.*]]
 | |
| ; CHECK:       seq.par.merged2:
 | |
| ; CHECK-NEXT:    [[TMP5:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    [[ADD1:%.*]] = add nsw i32 [[ADD_SEQ_OUTPUT_LOAD]], [[TMP5]]
 | |
| ; CHECK-NEXT:    store i32 [[ADD1]], i32* [[ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY5_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body5.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END4]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP6:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP6]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..25
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..26
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..27
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_seq_call
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..28 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..29 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..28
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..29
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..30
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_proc_bind
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..32 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..33 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..31
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..32
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..33
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_num_threads
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[TMP1]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..36 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..34
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..35
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..36
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_2_unmergable_1
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_2_unmergable_1..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_2_unmergable_1..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..37(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..38(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..37
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..38
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..39
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined.(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..1(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined.
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..1
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_proc_bind
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..2
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..3
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_num_threads
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[A]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..4 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..5 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..4
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..5
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_seq_call
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..6
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..7
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_seq..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..8(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..9(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP3]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..8
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..9
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_float
 | |
| ; CHECK-SAME: (float [[F:%.*]], float* nocapture nofree writeonly [[P:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[F_ADDR:%.*]] = alloca float, align 4
 | |
| ; CHECK-NEXT:    store float [[F]], float* [[F_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, float*, float*)* @merge_seq_float..omp_par to void (i32*, i32*, ...)*), float* [[F_ADDR]], float* [[P]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_float..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], float* [[F_ADDR:%.*]], float* [[P:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..10(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..11(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load float, float* [[F_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = fadd float [[TMP3]], 0x40091EB860000000
 | |
| ; CHECK-NEXT:    store float [[ADD]], float* [[P]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..10
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..11
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_firstprivate
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = alloca i64, align 8
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i64*)* @merge_seq_firstprivate..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_firstprivate..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..12(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD:%.*]] = load i64, i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..13(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i64 [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP3]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT:%.*]] = zext i32 [[ADD]] to i64
 | |
| ; CHECK-NEXT:    store i64 [[A_CASTED_SROA_0_0_INSERT_EXT]], i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..12
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..13
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i64 [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR_SROA_0_0_EXTRACT_TRUNC:%.*]] = trunc i64 [[A]] to i32
 | |
| ; CHECK-NEXT:    call void @use(i32 [[A_ADDR_SROA_0_0_EXTRACT_TRUNC]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_sink_lt
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_seq_sink_lt..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_sink_lt..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..14(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..15(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.start.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP3]])
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = ptrtoint i32* [[B]] to i64
 | |
| ; CHECK-NEXT:    [[TMP5:%.*]] = trunc i64 [[TMP4]] to i32
 | |
| ; CHECK-NEXT:    store i32 [[TMP5]], i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP3]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..14
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..15
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_par_use
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    [[LT_CAST3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.start.p0i8(i64 -1, i8* [[LT_CAST3]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_seq_par_use..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i32* [[B]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[LT_CAST:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[LT_CAST]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_seq_par_use..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i32* [[B:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..16(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..17(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[B]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP4]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..16
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..17
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[B:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[B]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP1]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions
 | |
| ; CHECK-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_cancellable_regions..omp_par to void (i32*, i32*, ...)*), i32* [[CANCEL1_ADDR]], i32* [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[CANCEL1_ADDR:%.*]], i32* [[CANCEL2_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..18(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..19(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..18
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..19
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq
 | |
| ; CHECK-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 2, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*)* @merge_cancellable_regions_seq..omp_par to void (i32*, i32*, ...)*), i32* [[CANCEL1_ADDR]], i32* [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[CANCEL1_ADDR:%.*]], i32* [[CANCEL2_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..20(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..21(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = load i32, i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP3]], 0
 | |
| ; CHECK-NEXT:    [[LNOT_EXT:%.*]] = zext i1 [[TOBOOL_NOT]] to i32
 | |
| ; CHECK-NEXT:    store i32 [[LNOT_EXT]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..20
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..21
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK:       if.then:
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       if.end:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_3..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..22(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..23(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..24(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..22
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..23
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..24
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3_seq
 | |
| ; CHECK-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[ADD1_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[ADD_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM7:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 3, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, i32*, i32*)* @merge_3_seq..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]], i32* [[ADD_SEQ_OUTPUT_ALLOC]], i32* [[ADD1_SEQ_OUTPUT_ALLOC]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    [[ADD1_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[ADD1_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_3_seq..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]], i32* [[ADD_SEQ_OUTPUT_ALLOC:%.*]], i32* [[ADD1_SEQ_OUTPUT_ALLOC:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..25(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    [[TMP2:%.*]] = icmp ne i32 [[TMP1]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP2]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK:       omp_region.end:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..26(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM4:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM4]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM3:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY5:%.*]], label [[OMP_REGION_END4:%.*]]
 | |
| ; CHECK:       omp_region.end4:
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM6:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM6]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split.split.split:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..27(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK:       omp_region.body5:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED2:%.*]]
 | |
| ; CHECK:       seq.par.merged2:
 | |
| ; CHECK-NEXT:    [[TMP5:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    [[ADD1:%.*]] = add nsw i32 [[ADD_SEQ_OUTPUT_LOAD]], [[TMP5]]
 | |
| ; CHECK-NEXT:    store i32 [[ADD1]], i32* [[ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split.split.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY5_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body5.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END4]]
 | |
| ; CHECK:       omp_region.body:
 | |
| ; CHECK-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK:       seq.par.merged:
 | |
| ; CHECK-NEXT:    [[TMP6:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP6]], 1
 | |
| ; CHECK-NEXT:    store i32 [[ADD]], i32* [[ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.merged.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK:       omp_region.body.split:
 | |
| ; CHECK-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB1]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..25
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..26
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..27
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_seq_call
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..28 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..29 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..28
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..29
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..30
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_proc_bind
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..32 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..33 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..31
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..32
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..33
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@unmergable_3_num_threads
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[TMP1:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[TMP1]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..36 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..34
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..35
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..36
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_2_unmergable_1
 | |
| ; CHECK-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK:       omp_parallel:
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB1]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*)* @merge_2_unmergable_1..omp_par to void (i32*, i32*, ...)*), i32* [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.exit.split:
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split.split:
 | |
| ; CHECK-NEXT:    call void (...) @foo()
 | |
| ; CHECK-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@merge_2_unmergable_1..omp_par
 | |
| ; CHECK-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], i32* [[A_ADDR:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK-NEXT:  omp.par.entry:
 | |
| ; CHECK-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK-NEXT:    store i32 [[TMP0]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK:       omp.par.region:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK:       omp.par.merged:
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..37(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB1]])
 | |
| ; CHECK-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK-NEXT:    call void @.omp_outlined..38(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK:       entry.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK:       omp.par.region.split:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK:       omp.par.pre_finalize:
 | |
| ; CHECK-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..37
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..38
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| ; CHECK-LABEL: define {{[^@]+}}@.omp_outlined..39
 | |
| ; CHECK-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK-NEXT:  entry:
 | |
| ; CHECK-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK-NEXT:    ret void
 | |
| 
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { i32* }, align 8
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2:[0-9]+]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32* }*)* @merge..omp_par to void (i32*, i32*, ...)*), { i32* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32* }* [[TMP0:%.*]]) #[[ATTR0:[0-9]+]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined. to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3:[0-9]+]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..1 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined.
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..1
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@unmergable_proc_bind
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1:[0-9]+]])
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..2
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..3
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@unmergable_num_threads
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[A]])
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..4 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..5 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..4
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..5
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@unmergable_seq_call
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    call void (...) @foo()
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..6
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..7
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_seq
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { i32* }, align 8
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32* }*)* @merge_seq..omp_par to void (i32*, i32*, ...)*), { i32* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_seq..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..8 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    [[TMP3:%.*]] = icmp ne i32 [[TMP2]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TMP3]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK1:       omp_region.end:
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split.split:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..9 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp_region.body:
 | |
| ; CHECK1-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       seq.par.merged:
 | |
| ; CHECK1-NEXT:    [[TMP4:%.*]] = load i32, i32* [[LOADGEP_A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP4]], 1
 | |
| ; CHECK1-NEXT:    store i32 [[ADD]], i32* [[LOADGEP_A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK1:       omp_region.body.split:
 | |
| ; CHECK1-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..8
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..9
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_seq_float
 | |
| ; CHECK1-SAME: (float [[F:%.*]], float* nocapture nofree writeonly [[P:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { float*, float*, float* }, align 8
 | |
| ; CHECK1-NEXT:    [[F_RELOADED:%.*]] = alloca float, align 4
 | |
| ; CHECK1-NEXT:    [[F_ADDR:%.*]] = alloca float, align 4
 | |
| ; CHECK1-NEXT:    store float [[F]], float* [[F_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    store float [[F]], float* [[F_RELOADED]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_F_RELOADED:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store float* [[F_RELOADED]], float** [[GEP_F_RELOADED]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_F_ADDR:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    store float* [[F_ADDR]], float** [[GEP_F_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_P:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[STRUCTARG]], i32 0, i32 2
 | |
| ; CHECK1-NEXT:    store float* [[P]], float** [[GEP_P]], align 8
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { float*, float*, float* }*)* @merge_seq_float..omp_par to void (i32*, i32*, ...)*), { float*, float*, float* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_seq_float..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { float*, float*, float* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[GEP_F_RELOADED:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_F_RELOADED:%.*]] = load float*, float** [[GEP_F_RELOADED]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_F_ADDR:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    [[LOADGEP_F_ADDR:%.*]] = load float*, float** [[GEP_F_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_P:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[TMP0]], i32 0, i32 2
 | |
| ; CHECK1-NEXT:    [[LOADGEP_P:%.*]] = load float*, float** [[GEP_P]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = load float, float* [[LOADGEP_F_RELOADED]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, float*)* @.omp_outlined..10 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_F_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK1:       omp_region.end:
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split.split:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, float*)* @.omp_outlined..11 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_F_ADDR]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp_region.body:
 | |
| ; CHECK1-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       seq.par.merged:
 | |
| ; CHECK1-NEXT:    [[ADD:%.*]] = fadd float [[TMP2]], 0x40091EB860000000
 | |
| ; CHECK1-NEXT:    store float [[ADD]], float* [[LOADGEP_P]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK1:       omp_region.body.split:
 | |
| ; CHECK1-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..10
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK1-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..11
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK1-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_seq_firstprivate
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { i32*, i64* }, align 8
 | |
| ; CHECK1-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = alloca i64, align 8
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i64* }, { i32*, i64* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i64* }, { i32*, i64* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    store i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], i64** [[GEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32*, i64* }*)* @merge_seq_firstprivate..omp_par to void (i32*, i32*, ...)*), { i32*, i64* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_seq_firstprivate..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32*, i64* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i64* }, { i32*, i64* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i64* }, { i32*, i64* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = load i64*, i64** [[GEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..12 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    [[TMP3:%.*]] = icmp ne i32 [[TMP2]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TMP3]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK1:       omp_region.end:
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split.split:
 | |
| ; CHECK1-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD:%.*]] = load i64, i64* [[LOADGEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i64)* @.omp_outlined..13 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i64 [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp_region.body:
 | |
| ; CHECK1-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       seq.par.merged:
 | |
| ; CHECK1-NEXT:    [[TMP4:%.*]] = load i32, i32* [[LOADGEP_A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP4]], 1
 | |
| ; CHECK1-NEXT:    store i32 [[ADD]], i32* [[LOADGEP_A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT:%.*]] = zext i32 [[ADD]] to i64
 | |
| ; CHECK1-NEXT:    store i64 [[A_CASTED_SROA_0_0_INSERT_EXT]], i64* [[LOADGEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK1:       omp_region.body.split:
 | |
| ; CHECK1-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..12
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..13
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i64 [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[A_ADDR_SROA_0_0_EXTRACT_TRUNC:%.*]] = trunc i64 [[A]] to i32
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[A_ADDR_SROA_0_0_EXTRACT_TRUNC]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_seq_sink_lt
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { i32* }, align 8
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32* }*)* @merge_seq_sink_lt..omp_par to void (i32*, i32*, ...)*), { i32* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_seq_sink_lt..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..14 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    [[TMP3:%.*]] = icmp ne i32 [[TMP2]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TMP3]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK1:       omp_region.end:
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split.split:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..15 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp_region.body:
 | |
| ; CHECK1-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       seq.par.merged:
 | |
| ; CHECK1-NEXT:    [[TMP4:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK1-NEXT:    call void @llvm.lifetime.start.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP4]])
 | |
| ; CHECK1-NEXT:    [[TMP5:%.*]] = ptrtoint i32* [[B]] to i64
 | |
| ; CHECK1-NEXT:    [[TMP6:%.*]] = trunc i64 [[TMP5]] to i32
 | |
| ; CHECK1-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP4]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK1:       omp_region.body.split:
 | |
| ; CHECK1-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..14
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..15
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_seq_par_use
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { i32*, i32*, i32* }, align 8
 | |
| ; CHECK1-NEXT:    [[A_RELOADED:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_RELOADED]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_A_RELOADED:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store i32* [[A_RELOADED]], i32** [[GEP_A_RELOADED]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_B:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 2
 | |
| ; CHECK1-NEXT:    store i32* [[B]], i32** [[GEP_B]], align 8
 | |
| ; CHECK1-NEXT:    [[LT_CAST3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK1-NEXT:    call void @llvm.lifetime.start.p0i8(i64 -1, i8* [[LT_CAST3]])
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32*, i32*, i32* }*)* @merge_seq_par_use..omp_par to void (i32*, i32*, ...)*), { i32*, i32*, i32* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    [[LT_CAST:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK1-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[LT_CAST]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_seq_par_use..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32*, i32*, i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[GEP_A_RELOADED:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_RELOADED:%.*]] = load i32*, i32** [[GEP_A_RELOADED]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_B:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 2
 | |
| ; CHECK1-NEXT:    [[LOADGEP_B:%.*]] = load i32*, i32** [[GEP_B]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = load i32, i32* [[LOADGEP_A_RELOADED]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..16 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK1:       omp_region.end:
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split.split:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*, i32*)* @.omp_outlined..17 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_B]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp_region.body:
 | |
| ; CHECK1-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       seq.par.merged:
 | |
| ; CHECK1-NEXT:    [[TMP5:%.*]] = bitcast i32* [[LOADGEP_B]] to i8*
 | |
| ; CHECK1-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP2]], 1
 | |
| ; CHECK1-NEXT:    store i32 [[ADD]], i32* [[LOADGEP_B]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK1:       omp_region.body.split:
 | |
| ; CHECK1-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..16
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..17
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[B:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[B]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP1]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_cancellable_regions
 | |
| ; CHECK1-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { i32*, i32* }, align 8
 | |
| ; CHECK1-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_CANCEL1_ADDR:%.*]] = getelementptr { i32*, i32* }, { i32*, i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store i32* [[CANCEL1_ADDR]], i32** [[GEP_CANCEL1_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_CANCEL2_ADDR:%.*]] = getelementptr { i32*, i32* }, { i32*, i32* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    store i32* [[CANCEL2_ADDR]], i32** [[GEP_CANCEL2_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32*, i32* }*)* @merge_cancellable_regions..omp_par to void (i32*, i32*, ...)*), { i32*, i32* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_cancellable_regions..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32*, i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[GEP_CANCEL1_ADDR:%.*]] = getelementptr { i32*, i32* }, { i32*, i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_CANCEL1_ADDR:%.*]] = load i32*, i32** [[GEP_CANCEL1_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_CANCEL2_ADDR:%.*]] = getelementptr { i32*, i32* }, { i32*, i32* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    [[LOADGEP_CANCEL2_ADDR:%.*]] = load i32*, i32** [[GEP_CANCEL2_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..18 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_CANCEL1_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..19 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_CANCEL2_ADDR]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..18
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK1-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK1:       if.then:
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ; CHECK1:       if.end:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..19
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK1-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK1:       if.then:
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ; CHECK1:       if.end:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq
 | |
| ; CHECK1-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { i32*, i32*, i32* }, align 8
 | |
| ; CHECK1-NEXT:    [[CANCEL1_RELOADED:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_RELOADED]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_CANCEL1_RELOADED:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store i32* [[CANCEL1_RELOADED]], i32** [[GEP_CANCEL1_RELOADED]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_CANCEL1_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    store i32* [[CANCEL1_ADDR]], i32** [[GEP_CANCEL1_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_CANCEL2_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 2
 | |
| ; CHECK1-NEXT:    store i32* [[CANCEL2_ADDR]], i32** [[GEP_CANCEL2_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32*, i32*, i32* }*)* @merge_cancellable_regions_seq..omp_par to void (i32*, i32*, ...)*), { i32*, i32*, i32* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32*, i32*, i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[GEP_CANCEL1_RELOADED:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_CANCEL1_RELOADED:%.*]] = load i32*, i32** [[GEP_CANCEL1_RELOADED]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_CANCEL1_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    [[LOADGEP_CANCEL1_ADDR:%.*]] = load i32*, i32** [[GEP_CANCEL1_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_CANCEL2_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 2
 | |
| ; CHECK1-NEXT:    [[LOADGEP_CANCEL2_ADDR:%.*]] = load i32*, i32** [[GEP_CANCEL2_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = load i32, i32* [[LOADGEP_CANCEL1_RELOADED]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..20 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_CANCEL1_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK1:       omp_region.end:
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split.split:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..21 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_CANCEL2_ADDR]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp_region.body:
 | |
| ; CHECK1-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       seq.par.merged:
 | |
| ; CHECK1-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP2]], 0
 | |
| ; CHECK1-NEXT:    [[LNOT_EXT:%.*]] = zext i1 [[TOBOOL_NOT]] to i32
 | |
| ; CHECK1-NEXT:    store i32 [[LNOT_EXT]], i32* [[LOADGEP_CANCEL2_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK1:       omp_region.body.split:
 | |
| ; CHECK1-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..20
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK1-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK1:       if.then:
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ; CHECK1:       if.end:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..21
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK1-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK1:       if.then:
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ; CHECK1:       if.end:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_3
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { i32* }, align 8
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32* }*)* @merge_3..omp_par to void (i32*, i32*, ...)*), { i32* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_3..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..22 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..23 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..24 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..22
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..23
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..24
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_3_seq
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { i32*, i32*, i32*, i32* }, align 8
 | |
| ; CHECK1-NEXT:    [[A_RELOADED:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[ADD1_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[ADD_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM7:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_RELOADED]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_A_RELOADED:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store i32* [[A_RELOADED]], i32** [[GEP_A_RELOADED]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_ADD_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 2
 | |
| ; CHECK1-NEXT:    store i32* [[ADD_SEQ_OUTPUT_ALLOC]], i32** [[GEP_ADD_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_ADD1_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 3
 | |
| ; CHECK1-NEXT:    store i32* [[ADD1_SEQ_OUTPUT_ALLOC]], i32** [[GEP_ADD1_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32*, i32*, i32*, i32* }*)* @merge_3_seq..omp_par to void (i32*, i32*, ...)*), { i32*, i32*, i32*, i32* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    [[ADD1_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[ADD1_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_3_seq..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32*, i32*, i32*, i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[GEP_A_RELOADED:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_RELOADED:%.*]] = load i32*, i32** [[GEP_A_RELOADED]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_ADD_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[TMP0]], i32 0, i32 2
 | |
| ; CHECK1-NEXT:    [[LOADGEP_ADD_SEQ_OUTPUT_ALLOC:%.*]] = load i32*, i32** [[GEP_ADD_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK1-NEXT:    [[GEP_ADD1_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[TMP0]], i32 0, i32 3
 | |
| ; CHECK1-NEXT:    [[LOADGEP_ADD1_SEQ_OUTPUT_ALLOC:%.*]] = load i32*, i32** [[GEP_ADD1_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TMP2:%.*]] = load i32, i32* [[LOADGEP_A_RELOADED]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..25 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK1:       omp_region.end:
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split.split:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..26 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM4:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM4]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM3:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    [[TMP5:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK1-NEXT:    [[TMP6:%.*]] = icmp ne i32 [[TMP5]], 0
 | |
| ; CHECK1-NEXT:    br i1 [[TMP6]], label [[OMP_REGION_BODY5:%.*]], label [[OMP_REGION_END4:%.*]]
 | |
| ; CHECK1:       omp_region.end4:
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM6:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM6]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split.split.split.split:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..27 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp_region.body5:
 | |
| ; CHECK1-NEXT:    br label [[SEQ_PAR_MERGED2:%.*]]
 | |
| ; CHECK1:       seq.par.merged2:
 | |
| ; CHECK1-NEXT:    [[ADD_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[LOADGEP_ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK1-NEXT:    [[ADD1:%.*]] = add nsw i32 [[ADD_SEQ_OUTPUT_LOAD]], [[TMP2]]
 | |
| ; CHECK1-NEXT:    store i32 [[ADD1]], i32* [[LOADGEP_ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split.split.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_BODY5_SPLIT:%.*]]
 | |
| ; CHECK1:       omp_region.body5.split:
 | |
| ; CHECK1-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_END4]]
 | |
| ; CHECK1:       omp_region.body:
 | |
| ; CHECK1-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       seq.par.merged:
 | |
| ; CHECK1-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP2]], 1
 | |
| ; CHECK1-NEXT:    store i32 [[ADD]], i32* [[LOADGEP_ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.merged.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK1:       omp_region.body.split:
 | |
| ; CHECK1-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..25
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..26
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..27
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@unmergable_3_seq_call
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..28 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    call void (...) @foo()
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..29 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    call void (...) @foo()
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..28
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..29
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..30
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@unmergable_3_proc_bind
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..32 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..33 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..31
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..32
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..33
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@unmergable_3_num_threads
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[A]])
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..36 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..34
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..35
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..36
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_2_unmergable_1
 | |
| ; CHECK1-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[STRUCTARG:%.*]] = alloca { i32* }, align 8
 | |
| ; CHECK1-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK1:       omp_parallel:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32* }*)* @merge_2_unmergable_1..omp_par to void (i32*, i32*, ...)*), { i32* }* [[STRUCTARG]])
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.exit.split:
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split.split:
 | |
| ; CHECK1-NEXT:    call void (...) @foo()
 | |
| ; CHECK1-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@merge_2_unmergable_1..omp_par
 | |
| ; CHECK1-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK1-NEXT:  omp.par.entry:
 | |
| ; CHECK1-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK1-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK1-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK1-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK1-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK1:       omp.par.region:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK1:       omp.par.merged:
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..37 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK1-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK1-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..38 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK1-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK1:       entry.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK1:       omp.par.region.split:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK1:       omp.par.pre_finalize:
 | |
| ; CHECK1-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK1:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..37
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..38
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK1-LABEL: define {{[^@]+}}@.omp_outlined..39
 | |
| ; CHECK1-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK1-NEXT:  entry:
 | |
| ; CHECK1-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK1-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK1-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { i32* }, align 8
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2:[0-9]+]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32* }*)* @merge..omp_par to void (i32*, i32*, ...)*), { i32* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32* }* [[TMP0:%.*]]) #[[ATTR0:[0-9]+]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined. to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3:[0-9]+]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..1 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined.
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..1
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@unmergable_proc_bind
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1:[0-9]+]])
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..2 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..3 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..2
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..3
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@unmergable_num_threads
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[A]])
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..4 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..5 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..4
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..5
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@unmergable_seq_call
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..6 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    call void (...) @foo()
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..7 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..6
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..7
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_seq
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { i32* }, align 8
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32* }*)* @merge_seq..omp_par to void (i32*, i32*, ...)*), { i32* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_seq..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..8 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    [[TMP3:%.*]] = icmp ne i32 [[TMP2]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TMP3]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK2:       omp_region.end:
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split.split:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..9 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp_region.body:
 | |
| ; CHECK2-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       seq.par.merged:
 | |
| ; CHECK2-NEXT:    [[TMP4:%.*]] = load i32, i32* [[LOADGEP_A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP4]], 1
 | |
| ; CHECK2-NEXT:    store i32 [[ADD]], i32* [[LOADGEP_A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK2:       omp_region.body.split:
 | |
| ; CHECK2-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..8
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..9
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_seq_float
 | |
| ; CHECK2-SAME: (float [[F:%.*]], float* nocapture nofree writeonly [[P:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { float*, float*, float* }, align 8
 | |
| ; CHECK2-NEXT:    [[F_RELOADED:%.*]] = alloca float, align 4
 | |
| ; CHECK2-NEXT:    [[F_ADDR:%.*]] = alloca float, align 4
 | |
| ; CHECK2-NEXT:    store float [[F]], float* [[F_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    store float [[F]], float* [[F_RELOADED]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_F_RELOADED:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store float* [[F_RELOADED]], float** [[GEP_F_RELOADED]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_F_ADDR:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    store float* [[F_ADDR]], float** [[GEP_F_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_P:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[STRUCTARG]], i32 0, i32 2
 | |
| ; CHECK2-NEXT:    store float* [[P]], float** [[GEP_P]], align 8
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { float*, float*, float* }*)* @merge_seq_float..omp_par to void (i32*, i32*, ...)*), { float*, float*, float* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_seq_float..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { float*, float*, float* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[GEP_F_RELOADED:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_F_RELOADED:%.*]] = load float*, float** [[GEP_F_RELOADED]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_F_ADDR:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    [[LOADGEP_F_ADDR:%.*]] = load float*, float** [[GEP_F_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_P:%.*]] = getelementptr { float*, float*, float* }, { float*, float*, float* }* [[TMP0]], i32 0, i32 2
 | |
| ; CHECK2-NEXT:    [[LOADGEP_P:%.*]] = load float*, float** [[GEP_P]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = load float, float* [[LOADGEP_F_RELOADED]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, float*)* @.omp_outlined..10 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_F_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK2:       omp_region.end:
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split.split:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, float*)* @.omp_outlined..11 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_F_ADDR]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp_region.body:
 | |
| ; CHECK2-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       seq.par.merged:
 | |
| ; CHECK2-NEXT:    [[ADD:%.*]] = fadd float [[TMP2]], 0x40091EB860000000
 | |
| ; CHECK2-NEXT:    store float [[ADD]], float* [[LOADGEP_P]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK2:       omp_region.body.split:
 | |
| ; CHECK2-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..10
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK2-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..11
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], float* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[F:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load float, float* [[F]], align 4
 | |
| ; CHECK2-NEXT:    [[CONV:%.*]] = fptosi float [[TMP0]] to i32
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[CONV]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_seq_firstprivate
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { i32*, i64* }, align 8
 | |
| ; CHECK2-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = alloca i64, align 8
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i64* }, { i32*, i64* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i64* }, { i32*, i64* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    store i64* [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], i64** [[GEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32*, i64* }*)* @merge_seq_firstprivate..omp_par to void (i32*, i32*, ...)*), { i32*, i64* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_seq_firstprivate..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32*, i64* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i64* }, { i32*, i64* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i64* }, { i32*, i64* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC:%.*]] = load i64*, i64** [[GEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..12 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    [[TMP3:%.*]] = icmp ne i32 [[TMP2]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TMP3]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK2:       omp_region.end:
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split.split:
 | |
| ; CHECK2-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD:%.*]] = load i64, i64* [[LOADGEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i64)* @.omp_outlined..13 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i64 [[A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp_region.body:
 | |
| ; CHECK2-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       seq.par.merged:
 | |
| ; CHECK2-NEXT:    [[TMP4:%.*]] = load i32, i32* [[LOADGEP_A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP4]], 1
 | |
| ; CHECK2-NEXT:    store i32 [[ADD]], i32* [[LOADGEP_A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[A_CASTED_SROA_0_0_INSERT_EXT:%.*]] = zext i32 [[ADD]] to i64
 | |
| ; CHECK2-NEXT:    store i64 [[A_CASTED_SROA_0_0_INSERT_EXT]], i64* [[LOADGEP_A_CASTED_SROA_0_0_INSERT_EXT_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK2:       omp_region.body.split:
 | |
| ; CHECK2-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..12
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..13
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i64 [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[A_ADDR_SROA_0_0_EXTRACT_TRUNC:%.*]] = trunc i64 [[A]] to i32
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[A_ADDR_SROA_0_0_EXTRACT_TRUNC]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_seq_sink_lt
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { i32* }, align 8
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32* }*)* @merge_seq_sink_lt..omp_par to void (i32*, i32*, ...)*), { i32* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_seq_sink_lt..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..14 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    [[TMP3:%.*]] = icmp ne i32 [[TMP2]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TMP3]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK2:       omp_region.end:
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split.split:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..15 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp_region.body:
 | |
| ; CHECK2-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       seq.par.merged:
 | |
| ; CHECK2-NEXT:    [[TMP4:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK2-NEXT:    call void @llvm.lifetime.start.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP4]])
 | |
| ; CHECK2-NEXT:    [[TMP5:%.*]] = ptrtoint i32* [[B]] to i64
 | |
| ; CHECK2-NEXT:    [[TMP6:%.*]] = trunc i64 [[TMP5]] to i32
 | |
| ; CHECK2-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[TMP4]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK2:       omp_region.body.split:
 | |
| ; CHECK2-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..14
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..15
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_seq_par_use
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { i32*, i32*, i32* }, align 8
 | |
| ; CHECK2-NEXT:    [[A_RELOADED:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[B:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_RELOADED]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_A_RELOADED:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store i32* [[A_RELOADED]], i32** [[GEP_A_RELOADED]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_B:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 2
 | |
| ; CHECK2-NEXT:    store i32* [[B]], i32** [[GEP_B]], align 8
 | |
| ; CHECK2-NEXT:    [[LT_CAST3:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK2-NEXT:    call void @llvm.lifetime.start.p0i8(i64 -1, i8* [[LT_CAST3]])
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32*, i32*, i32* }*)* @merge_seq_par_use..omp_par to void (i32*, i32*, ...)*), { i32*, i32*, i32* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    [[LT_CAST:%.*]] = bitcast i32* [[B]] to i8*
 | |
| ; CHECK2-NEXT:    call void @llvm.lifetime.end.p0i8(i64 noundef 4, i8* noundef nonnull [[LT_CAST]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_seq_par_use..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32*, i32*, i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[GEP_A_RELOADED:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_RELOADED:%.*]] = load i32*, i32** [[GEP_A_RELOADED]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_B:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 2
 | |
| ; CHECK2-NEXT:    [[LOADGEP_B:%.*]] = load i32*, i32** [[GEP_B]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = load i32, i32* [[LOADGEP_A_RELOADED]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..16 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK2:       omp_region.end:
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split.split:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*, i32*)* @.omp_outlined..17 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_B]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp_region.body:
 | |
| ; CHECK2-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       seq.par.merged:
 | |
| ; CHECK2-NEXT:    [[TMP5:%.*]] = bitcast i32* [[LOADGEP_B]] to i8*
 | |
| ; CHECK2-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP2]], 1
 | |
| ; CHECK2-NEXT:    store i32 [[ADD]], i32* [[LOADGEP_B]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK2:       omp_region.body.split:
 | |
| ; CHECK2-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..16
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..17
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[B:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[B]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP1]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_cancellable_regions
 | |
| ; CHECK2-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { i32*, i32* }, align 8
 | |
| ; CHECK2-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_CANCEL1_ADDR:%.*]] = getelementptr { i32*, i32* }, { i32*, i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store i32* [[CANCEL1_ADDR]], i32** [[GEP_CANCEL1_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_CANCEL2_ADDR:%.*]] = getelementptr { i32*, i32* }, { i32*, i32* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    store i32* [[CANCEL2_ADDR]], i32** [[GEP_CANCEL2_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32*, i32* }*)* @merge_cancellable_regions..omp_par to void (i32*, i32*, ...)*), { i32*, i32* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_cancellable_regions..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32*, i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[GEP_CANCEL1_ADDR:%.*]] = getelementptr { i32*, i32* }, { i32*, i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_CANCEL1_ADDR:%.*]] = load i32*, i32** [[GEP_CANCEL1_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_CANCEL2_ADDR:%.*]] = getelementptr { i32*, i32* }, { i32*, i32* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    [[LOADGEP_CANCEL2_ADDR:%.*]] = load i32*, i32** [[GEP_CANCEL2_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..18 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_CANCEL1_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..19 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_CANCEL2_ADDR]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..18
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK2-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK2:       if.then:
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ; CHECK2:       if.end:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..19
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK2-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK2:       if.then:
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ; CHECK2:       if.end:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq
 | |
| ; CHECK2-SAME: (i32 [[CANCEL1:%.*]], i32 [[CANCEL2:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { i32*, i32*, i32* }, align 8
 | |
| ; CHECK2-NEXT:    [[CANCEL1_RELOADED:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[CANCEL1_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[CANCEL2_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[CANCEL2]], i32* [[CANCEL2_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    store i32 [[CANCEL1]], i32* [[CANCEL1_RELOADED]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_CANCEL1_RELOADED:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store i32* [[CANCEL1_RELOADED]], i32** [[GEP_CANCEL1_RELOADED]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_CANCEL1_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    store i32* [[CANCEL1_ADDR]], i32** [[GEP_CANCEL1_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_CANCEL2_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 2
 | |
| ; CHECK2-NEXT:    store i32* [[CANCEL2_ADDR]], i32** [[GEP_CANCEL2_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32*, i32*, i32* }*)* @merge_cancellable_regions_seq..omp_par to void (i32*, i32*, ...)*), { i32*, i32*, i32* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_cancellable_regions_seq..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32*, i32*, i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[GEP_CANCEL1_RELOADED:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_CANCEL1_RELOADED:%.*]] = load i32*, i32** [[GEP_CANCEL1_RELOADED]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_CANCEL1_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    [[LOADGEP_CANCEL1_ADDR:%.*]] = load i32*, i32** [[GEP_CANCEL1_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_CANCEL2_ADDR:%.*]] = getelementptr { i32*, i32*, i32* }, { i32*, i32*, i32* }* [[TMP0]], i32 0, i32 2
 | |
| ; CHECK2-NEXT:    [[LOADGEP_CANCEL2_ADDR:%.*]] = load i32*, i32** [[GEP_CANCEL2_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = load i32, i32* [[LOADGEP_CANCEL1_RELOADED]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..20 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_CANCEL1_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK2:       omp_region.end:
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split.split:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..21 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_CANCEL2_ADDR]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp_region.body:
 | |
| ; CHECK2-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       seq.par.merged:
 | |
| ; CHECK2-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP2]], 0
 | |
| ; CHECK2-NEXT:    [[LNOT_EXT:%.*]] = zext i1 [[TOBOOL_NOT]] to i32
 | |
| ; CHECK2-NEXT:    store i32 [[LNOT_EXT]], i32* [[LOADGEP_CANCEL2_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK2:       omp_region.body.split:
 | |
| ; CHECK2-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..20
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL1:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL1]], align 4
 | |
| ; CHECK2-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK2:       if.then:
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ; CHECK2:       if.end:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..21
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readonly [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[CANCEL2:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[CANCEL2]], align 4
 | |
| ; CHECK2-NEXT:    [[TOBOOL_NOT:%.*]] = icmp eq i32 [[TMP0]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TOBOOL_NOT]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
 | |
| ; CHECK2:       if.then:
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[DOTGLOBAL_TID_]], align 4
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = call i32 @__kmpc_cancel(%struct.ident_t* noundef nonnull @[[GLOB1]], i32 [[TMP1]], i32 noundef 1)
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ; CHECK2:       if.end:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_3
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { i32* }, align 8
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32* }*)* @merge_3..omp_par to void (i32*, i32*, ...)*), { i32* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_3..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..22 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..23 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..24 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..22
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..23
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..24
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_3_seq
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { i32*, i32*, i32*, i32* }, align 8
 | |
| ; CHECK2-NEXT:    [[A_RELOADED:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[ADD1_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[ADD_SEQ_OUTPUT_ALLOC:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM7:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_RELOADED]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_A_RELOADED:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store i32* [[A_RELOADED]], i32** [[GEP_A_RELOADED]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_ADD_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 2
 | |
| ; CHECK2-NEXT:    store i32* [[ADD_SEQ_OUTPUT_ALLOC]], i32** [[GEP_ADD_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_ADD1_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[STRUCTARG]], i32 0, i32 3
 | |
| ; CHECK2-NEXT:    store i32* [[ADD1_SEQ_OUTPUT_ALLOC]], i32** [[GEP_ADD1_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32*, i32*, i32*, i32* }*)* @merge_3_seq..omp_par to void (i32*, i32*, ...)*), { i32*, i32*, i32*, i32* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    [[ADD1_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[ADD1_SEQ_OUTPUT_LOAD]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_3_seq..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32*, i32*, i32*, i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[GEP_A_RELOADED:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_RELOADED:%.*]] = load i32*, i32** [[GEP_A_RELOADED]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[TMP0]], i32 0, i32 1
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_ADD_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[TMP0]], i32 0, i32 2
 | |
| ; CHECK2-NEXT:    [[LOADGEP_ADD_SEQ_OUTPUT_ALLOC:%.*]] = load i32*, i32** [[GEP_ADD_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK2-NEXT:    [[GEP_ADD1_SEQ_OUTPUT_ALLOC:%.*]] = getelementptr { i32*, i32*, i32*, i32* }, { i32*, i32*, i32*, i32* }* [[TMP0]], i32 0, i32 3
 | |
| ; CHECK2-NEXT:    [[LOADGEP_ADD1_SEQ_OUTPUT_ALLOC:%.*]] = load i32*, i32** [[GEP_ADD1_SEQ_OUTPUT_ALLOC]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TMP2:%.*]] = load i32, i32* [[LOADGEP_A_RELOADED]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..25 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM2:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM2]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    [[TMP3:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    [[TMP4:%.*]] = icmp ne i32 [[TMP3]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TMP4]], label [[OMP_REGION_BODY:%.*]], label [[OMP_REGION_END:%.*]]
 | |
| ; CHECK2:       omp_region.end:
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM1:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM1]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split.split:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..26 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM4:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM4]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM3:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    [[TMP5:%.*]] = call i32 @__kmpc_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK2-NEXT:    [[TMP6:%.*]] = icmp ne i32 [[TMP5]], 0
 | |
| ; CHECK2-NEXT:    br i1 [[TMP6]], label [[OMP_REGION_BODY5:%.*]], label [[OMP_REGION_END4:%.*]]
 | |
| ; CHECK2:       omp_region.end4:
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM6:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM6]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split.split.split.split:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..27 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp_region.body5:
 | |
| ; CHECK2-NEXT:    br label [[SEQ_PAR_MERGED2:%.*]]
 | |
| ; CHECK2:       seq.par.merged2:
 | |
| ; CHECK2-NEXT:    [[ADD_SEQ_OUTPUT_LOAD:%.*]] = load i32, i32* [[LOADGEP_ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK2-NEXT:    [[ADD1:%.*]] = add nsw i32 [[ADD_SEQ_OUTPUT_LOAD]], [[TMP2]]
 | |
| ; CHECK2-NEXT:    store i32 [[ADD1]], i32* [[LOADGEP_ADD1_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split.split.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_BODY5_SPLIT:%.*]]
 | |
| ; CHECK2:       omp_region.body5.split:
 | |
| ; CHECK2-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM3]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_END4]]
 | |
| ; CHECK2:       omp_region.body:
 | |
| ; CHECK2-NEXT:    br label [[SEQ_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       seq.par.merged:
 | |
| ; CHECK2-NEXT:    [[ADD:%.*]] = add nsw i32 [[TMP2]], 1
 | |
| ; CHECK2-NEXT:    store i32 [[ADD]], i32* [[LOADGEP_ADD_SEQ_OUTPUT_ALLOC]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.merged.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_BODY_SPLIT:%.*]]
 | |
| ; CHECK2:       omp_region.body.split:
 | |
| ; CHECK2-NEXT:    call void @__kmpc_end_master(%struct.ident_t* @[[GLOB2]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_REGION_END]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..25
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..26
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..27
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@unmergable_3_seq_call
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..28 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    call void (...) @foo()
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..29 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    call void (...) @foo()
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..30 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..28
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..29
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..30
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@unmergable_3_proc_bind
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..31 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_push_proc_bind(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 noundef 3)
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..32 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..33 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..31
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..32
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..33
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@unmergable_3_num_threads
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]])
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..34 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_push_num_threads(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 [[TMP0]], i32 [[A]])
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..35 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..36 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..34
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..35
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..36
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_2_unmergable_1
 | |
| ; CHECK2-SAME: (i32 [[A:%.*]]) local_unnamed_addr {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[STRUCTARG:%.*]] = alloca { i32* }, align 8
 | |
| ; CHECK2-NEXT:    [[A_ADDR:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    store i32 [[A]], i32* [[A_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PARALLEL:%.*]]
 | |
| ; CHECK2:       omp_parallel:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[STRUCTARG]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    store i32* [[A_ADDR]], i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* @[[GLOB2]], i32 1, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, { i32* }*)* @merge_2_unmergable_1..omp_par to void (i32*, i32*, ...)*), { i32* }* [[STRUCTARG]])
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_EXIT_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.exit.split:
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split.split:
 | |
| ; CHECK2-NEXT:    call void (...) @foo()
 | |
| ; CHECK2-NEXT:    call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* noundef nonnull align 8 dereferenceable(24) @[[GLOB1]], i32 noundef 1, void (i32*, i32*, ...)* noundef bitcast (void (i32*, i32*, i32*)* @.omp_outlined..39 to void (i32*, i32*, ...)*), i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A_ADDR]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@merge_2_unmergable_1..omp_par
 | |
| ; CHECK2-SAME: (i32* noalias [[TID_ADDR:%.*]], i32* noalias [[ZERO_ADDR:%.*]], { i32* }* [[TMP0:%.*]]) #[[ATTR0]] {
 | |
| ; CHECK2-NEXT:  omp.par.entry:
 | |
| ; CHECK2-NEXT:    [[GEP_A_ADDR:%.*]] = getelementptr { i32* }, { i32* }* [[TMP0]], i32 0, i32 0
 | |
| ; CHECK2-NEXT:    [[LOADGEP_A_ADDR:%.*]] = load i32*, i32** [[GEP_A_ADDR]], align 8
 | |
| ; CHECK2-NEXT:    [[TID_ADDR_LOCAL:%.*]] = alloca i32, align 4
 | |
| ; CHECK2-NEXT:    [[TMP1:%.*]] = load i32, i32* [[TID_ADDR]], align 4
 | |
| ; CHECK2-NEXT:    store i32 [[TMP1]], i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    [[TID:%.*]] = load i32, i32* [[TID_ADDR_LOCAL]], align 4
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION:%.*]]
 | |
| ; CHECK2:       omp.par.region:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_MERGED:%.*]]
 | |
| ; CHECK2:       omp.par.merged:
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..37 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    [[OMP_GLOBAL_THREAD_NUM:%.*]] = call i32 @__kmpc_global_thread_num(%struct.ident_t* @[[GLOB2]])
 | |
| ; CHECK2-NEXT:    call void @__kmpc_barrier(%struct.ident_t* @[[GLOB3]], i32 [[OMP_GLOBAL_THREAD_NUM]])
 | |
| ; CHECK2-NEXT:    call void (i32*, i32*, ...) bitcast (void (i32*, i32*, i32*)* @.omp_outlined..38 to void (i32*, i32*, ...)*)(i32* [[TID_ADDR]], i32* [[ZERO_ADDR]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[LOADGEP_A_ADDR]])
 | |
| ; CHECK2-NEXT:    br label [[ENTRY_SPLIT:%.*]]
 | |
| ; CHECK2:       entry.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_REGION_SPLIT:%.*]]
 | |
| ; CHECK2:       omp.par.region.split:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_PRE_FINALIZE:%.*]]
 | |
| ; CHECK2:       omp.par.pre_finalize:
 | |
| ; CHECK2-NEXT:    br label [[OMP_PAR_OUTLINED_EXIT_EXITSTUB:%.*]]
 | |
| ; CHECK2:       omp.par.outlined.exit.exitStub:
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..37
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..38
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 | |
| ;
 | |
| ; CHECK2-LABEL: define {{[^@]+}}@.omp_outlined..39
 | |
| ; CHECK2-SAME: (i32* noalias nocapture nofree readnone [[DOTGLOBAL_TID_:%.*]], i32* noalias nocapture nofree readnone [[DOTBOUND_TID_:%.*]], i32* nocapture nofree noundef nonnull readonly align 4 dereferenceable(4) [[A:%.*]]) {
 | |
| ; CHECK2-NEXT:  entry:
 | |
| ; CHECK2-NEXT:    [[TMP0:%.*]] = load i32, i32* [[A]], align 4
 | |
| ; CHECK2-NEXT:    call void @use(i32 [[TMP0]])
 | |
| ; CHECK2-NEXT:    ret void
 | |
| ;
 |