186 lines
		
	
	
		
			8.1 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			186 lines
		
	
	
		
			8.1 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
 | |
| ; RUN: opt -function-specialization -func-specialization-max-clones=0 -func-specialization-size-threshold=14 -S < %s | FileCheck %s --check-prefix=NONE
 | |
| ; RUN: opt -function-specialization -func-specialization-max-clones=1 -func-specialization-size-threshold=14 -S < %s | FileCheck %s --check-prefix=ONE
 | |
| ; RUN: opt -function-specialization -func-specialization-max-clones=2 -func-specialization-size-threshold=14 -S < %s | FileCheck %s --check-prefix=TWO
 | |
| ; RUN: opt -function-specialization -func-specialization-max-clones=3 -func-specialization-size-threshold=14 -S < %s | FileCheck %s --check-prefix=THREE
 | |
| 
 | |
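| ; Make sure that we iterate correctly after sorting the specializations by gain.
 | |
| ; With -func-specialization-max-clones=N, only the N highest-gain candidates
 | |
| ; listed below are expected to be cloned (gain 982 first, then 795, then 608):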
 | |
| ; FnSpecialization: Specializations for function compute
 | |
| ; FnSpecialization:   Gain = 608
 | |
| ; FnSpecialization:   FormalArg = binop1, ActualArg = power
 | |
| ; FnSpecialization:   FormalArg = binop2, ActualArg = mul
 | |
| ; FnSpecialization:   Gain = 982
 | |
| ; FnSpecialization:   FormalArg = binop1, ActualArg = plus
 | |
| ; FnSpecialization:   FormalArg = binop2, ActualArg = minus
 | |
| ; FnSpecialization:   Gain = 795
 | |
| ; FnSpecialization:   FormalArg = binop1, ActualArg = minus
 | |
| ; FnSpecialization:   FormalArg = binop2, ActualArg = power
 | |
| 
 | |
| ; Driver with three call sites of @compute, each passing a different pair of
 | |
| ; function pointers: (@power, @mul) in block %plus, (@plus, @minus) in block
 | |
| ; %minus, and (@minus, @power) in block %merge. Note that the block names do
 | |
| ; not match the callees passed there. The check lines inside the body record,
 | |
| ; for each FileCheck prefix, which call sites are expected to be redirected to
 | |
| ; a clone (@compute.1, @compute.2, @compute.3) and which still call @compute.
 | |
| define i64 @main(i64 %x, i64 %y, i1 %flag) {
 | |
| ; NONE-LABEL: @main(
 | |
| ; NONE-NEXT:  entry:
 | |
| ; NONE-NEXT:    br i1 [[FLAG:%.*]], label [[PLUS:%.*]], label [[MINUS:%.*]]
 | |
| ; NONE:       plus:
 | |
| ; NONE-NEXT:    [[TMP0:%.*]] = call i64 @compute(i64 [[X:%.*]], i64 [[Y:%.*]], i64 (i64, i64)* @power, i64 (i64, i64)* @mul)
 | |
| ; NONE-NEXT:    br label [[MERGE:%.*]]
 | |
| ; NONE:       minus:
 | |
| ; NONE-NEXT:    [[TMP1:%.*]] = call i64 @compute(i64 [[X]], i64 [[Y]], i64 (i64, i64)* @plus, i64 (i64, i64)* @minus)
 | |
| ; NONE-NEXT:    br label [[MERGE]]
 | |
| ; NONE:       merge:
 | |
| ; NONE-NEXT:    [[TMP2:%.*]] = phi i64 [ [[TMP0]], [[PLUS]] ], [ [[TMP1]], [[MINUS]] ]
 | |
| ; NONE-NEXT:    [[TMP3:%.*]] = call i64 @compute(i64 [[TMP2]], i64 42, i64 (i64, i64)* @minus, i64 (i64, i64)* @power)
 | |
| ; NONE-NEXT:    ret i64 [[TMP3]]
 | |
| ;
 | |
| ; ONE-LABEL: @main(
 | |
| ; ONE-NEXT:  entry:
 | |
| ; ONE-NEXT:    br i1 [[FLAG:%.*]], label [[PLUS:%.*]], label [[MINUS:%.*]]
 | |
| ; ONE:       plus:
 | |
| ; ONE-NEXT:    [[TMP0:%.*]] = call i64 @compute(i64 [[X:%.*]], i64 [[Y:%.*]], i64 (i64, i64)* @power, i64 (i64, i64)* @mul)
 | |
| ; ONE-NEXT:    br label [[MERGE:%.*]]
 | |
| ; ONE:       minus:
 | |
| ; ONE-NEXT:    [[TMP1:%.*]] = call i64 @compute.1(i64 [[X]], i64 [[Y]], i64 (i64, i64)* @plus, i64 (i64, i64)* @minus)
 | |
| ; ONE-NEXT:    br label [[MERGE]]
 | |
| ; ONE:       merge:
 | |
| ; ONE-NEXT:    [[TMP2:%.*]] = phi i64 [ [[TMP0]], [[PLUS]] ], [ [[TMP1]], [[MINUS]] ]
 | |
| ; ONE-NEXT:    [[TMP3:%.*]] = call i64 @compute(i64 [[TMP2]], i64 42, i64 (i64, i64)* @minus, i64 (i64, i64)* @power)
 | |
| ; ONE-NEXT:    ret i64 [[TMP3]]
 | |
| ;
 | |
| ; TWO-LABEL: @main(
 | |
| ; TWO-NEXT:  entry:
 | |
| ; TWO-NEXT:    br i1 [[FLAG:%.*]], label [[PLUS:%.*]], label [[MINUS:%.*]]
 | |
| ; TWO:       plus:
 | |
| ; TWO-NEXT:    [[TMP0:%.*]] = call i64 @compute(i64 [[X:%.*]], i64 [[Y:%.*]], i64 (i64, i64)* @power, i64 (i64, i64)* @mul)
 | |
| ; TWO-NEXT:    br label [[MERGE:%.*]]
 | |
| ; TWO:       minus:
 | |
| ; TWO-NEXT:    [[TMP1:%.*]] = call i64 @compute.1(i64 [[X]], i64 [[Y]], i64 (i64, i64)* @plus, i64 (i64, i64)* @minus)
 | |
| ; TWO-NEXT:    br label [[MERGE]]
 | |
| ; TWO:       merge:
 | |
| ; TWO-NEXT:    [[TMP2:%.*]] = phi i64 [ [[TMP0]], [[PLUS]] ], [ [[TMP1]], [[MINUS]] ]
 | |
| ; TWO-NEXT:    [[TMP3:%.*]] = call i64 @compute.2(i64 [[TMP2]], i64 42, i64 (i64, i64)* @minus, i64 (i64, i64)* @power)
 | |
| ; TWO-NEXT:    ret i64 [[TMP3]]
 | |
| ;
 | |
| ; THREE-LABEL: @main(
 | |
| ; THREE-NEXT:  entry:
 | |
| ; THREE-NEXT:    br i1 [[FLAG:%.*]], label [[PLUS:%.*]], label [[MINUS:%.*]]
 | |
| ; THREE:       plus:
 | |
| ; THREE-NEXT:    [[TMP0:%.*]] = call i64 @compute.3(i64 [[X:%.*]], i64 [[Y:%.*]], i64 (i64, i64)* @power, i64 (i64, i64)* @mul)
 | |
| ; THREE-NEXT:    br label [[MERGE:%.*]]
 | |
| ; THREE:       minus:
 | |
| ; THREE-NEXT:    [[TMP1:%.*]] = call i64 @compute.1(i64 [[X]], i64 [[Y]], i64 (i64, i64)* @plus, i64 (i64, i64)* @minus)
 | |
| ; THREE-NEXT:    br label [[MERGE]]
 | |
| ; THREE:       merge:
 | |
| ; THREE-NEXT:    [[TMP2:%.*]] = phi i64 [ [[TMP0]], [[PLUS]] ], [ [[TMP1]], [[MINUS]] ]
 | |
| ; THREE-NEXT:    [[TMP3:%.*]] = call i64 @compute.2(i64 [[TMP2]], i64 42, i64 (i64, i64)* @minus, i64 (i64, i64)* @power)
 | |
| ; THREE-NEXT:    ret i64 [[TMP3]]
 | |
| ;
 | |
| entry:
 | |
|   br i1 %flag, label %plus, label %minus
 | |
| 
 | |
| plus:
 | |
|   %tmp0 = call i64 @compute(i64 %x, i64 %y, i64 (i64, i64)* @power, i64 (i64, i64)* @mul)
 | |
|   br label %merge
 | |
| 
 | |
| minus:
 | |
|   %tmp1 = call i64 @compute(i64 %x, i64 %y, i64 (i64, i64)* @plus, i64 (i64, i64)* @minus)
 | |
|   br label %merge
 | |
| 
 | |
| merge:
 | |
|   %tmp2 = phi i64 [ %tmp0, %plus ], [ %tmp1, %minus]
 | |
|   %tmp3 = call i64 @compute(i64 %tmp2, i64 42, i64 (i64, i64)* @minus, i64 (i64, i64)* @power)
 | |
|   ret i64 %tmp3
 | |
| }
 | |
| 
 | |
| ; THREE-NOT: define internal i64 @compute
 | |
| ;
 | |
| ; THREE-LABEL: define internal i64 @compute.1(i64 %x, i64 %y, i64 (i64, i64)* %binop1, i64 (i64, i64)* %binop2) {
 | |
| ; THREE-NEXT:  entry:
 | |
| ; THREE-NEXT:    [[TMP0:%.+]] = call i64 @plus(i64 %x, i64 %y)
 | |
| ; THREE-NEXT:    [[TMP1:%.+]] = call i64 @minus(i64 %x, i64 %y)
 | |
| ; THREE-NEXT:    [[TMP2:%.+]] = add i64 [[TMP0]], [[TMP1]]
 | |
| ; THREE-NEXT:    [[TMP3:%.+]] = sdiv i64 [[TMP2]], %x
 | |
| ; THREE-NEXT:    [[TMP4:%.+]] = sub i64 [[TMP3]], %y
 | |
| ; THREE-NEXT:    [[TMP5:%.+]] = mul i64 [[TMP4]], 2
 | |
| ; THREE-NEXT:    ret i64 [[TMP5]]
 | |
| ; THREE-NEXT:  }
 | |
| ;
 | |
| ; THREE-LABEL: define internal i64 @compute.2(i64 %x, i64 %y, i64 (i64, i64)* %binop1, i64 (i64, i64)* %binop2) {
 | |
| ; THREE-NEXT:  entry:
 | |
| ; THREE-NEXT:    [[TMP0:%.+]] = call i64 @minus(i64 %x, i64 %y)
 | |
| ; THREE-NEXT:    [[TMP1:%.+]] = call i64 @power(i64 %x, i64 %y)
 | |
| ; THREE-NEXT:    [[TMP2:%.+]] = add i64 [[TMP0]], [[TMP1]]
 | |
| ; THREE-NEXT:    [[TMP3:%.+]] = sdiv i64 [[TMP2]], %x
 | |
| ; THREE-NEXT:    [[TMP4:%.+]] = sub i64 [[TMP3]], %y
 | |
| ; THREE-NEXT:    [[TMP5:%.+]] = mul i64 [[TMP4]], 2
 | |
| ; THREE-NEXT:    ret i64 [[TMP5]]
 | |
| ; THREE-NEXT:  }
 | |
| ;
 | |
| ; THREE-LABEL: define internal i64 @compute.3(i64 %x, i64 %y, i64 (i64, i64)* %binop1, i64 (i64, i64)* %binop2) {
 | |
| ; THREE-NEXT:  entry:
 | |
| ; THREE-NEXT:    [[TMP0:%.+]] = call i64 @power(i64 %x, i64 %y)
 | |
| ; THREE-NEXT:    [[TMP1:%.+]] = call i64 @mul(i64 %x, i64 %y)
 | |
| ; THREE-NEXT:    [[TMP2:%.+]] = add i64 [[TMP0]], [[TMP1]]
 | |
| ; THREE-NEXT:    [[TMP3:%.+]] = sdiv i64 [[TMP2]], %x
 | |
| ; THREE-NEXT:    [[TMP4:%.+]] = sub i64 [[TMP3]], %y
 | |
| ; THREE-NEXT:    [[TMP5:%.+]] = mul i64 [[TMP4]], 2
 | |
| ; THREE-NEXT:    ret i64 [[TMP5]]
 | |
| ; THREE-NEXT:  }
 | |
| ;
 | |
| ; The function being specialized in this test. It calls %binop1 and %binop2
 | |
| ; indirectly on (%x, %y), adds the two results, signed-divides the sum by %x,
 | |
| ; subtracts %y, and returns that value multiplied by 2. Every call site in
 | |
| ; @main passes known functions for both pointer arguments.
 | |
| define internal i64 @compute(i64 %x, i64 %y, i64 (i64, i64)* %binop1, i64 (i64, i64)* %binop2) {
 | |
| entry:
 | |
|   %tmp0 = call i64 %binop1(i64 %x, i64 %y)
 | |
|   %tmp1 = call i64 %binop2(i64 %x, i64 %y)
 | |
|   %add = add i64 %tmp0, %tmp1
 | |
|   %div = sdiv i64 %add, %x
 | |
|   %sub = sub i64 %div, %y
 | |
|   %mul = mul i64 %sub, 2
 | |
|   ret i64 %mul
 | |
| }
 | |
| 
 | |
| ; Binary-operation callee passed to @compute from @main; returns %x + %y.
 | |
| define internal i64 @plus(i64 %x, i64 %y) {
 | |
| entry:
 | |
|   %tmp0 = add i64 %x, %y
 | |
|   ret i64 %tmp0
 | |
| }
 | |
| 
 | |
| ; Binary-operation callee passed to @compute from @main; returns %x - %y.
 | |
| define internal i64 @minus(i64 %x, i64 %y) {
 | |
| entry:
 | |
|   %tmp0 = sub i64 %x, %y
 | |
|   ret i64 %tmp0
 | |
| }
 | |
| 
 | |
| ; Loop-carrying callee passed to @compute from @main. Returns %x unchanged when
 | |
| ; %n <= 1 (signed compare). Otherwise the loop runs %n - 1 times, and each
 | |
| ; iteration shifts the running value left by one bit (the value named %add is
 | |
| ; a shl by 1, not an add); the final shifted value is returned.
 | |
| define internal i64 @mul(i64 %x, i64 %n) {
 | |
| entry:
 | |
|   %cmp6 = icmp sgt i64 %n, 1
 | |
|   br i1 %cmp6, label %for.body, label %for.cond.cleanup
 | |
| 
 | |
| for.cond.cleanup:                                 ; preds = %for.body, %entry
 | |
|   %x.addr.0.lcssa = phi i64 [ %x, %entry ], [ %add, %for.body ]
 | |
|   ret i64 %x.addr.0.lcssa
 | |
| 
 | |
| for.body:                                         ; preds = %entry, %for.body
 | |
|   %indvars.iv = phi i64 [ %indvars.iv.next, %for.body ], [ 1, %entry ]
 | |
|   %x.addr.07 = phi i64 [ %add, %for.body ], [ %x, %entry ]
 | |
|   %add = shl nsw i64 %x.addr.07, 1
 | |
|   %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
 | |
|   %exitcond.not = icmp eq i64 %indvars.iv.next, %n
 | |
|   br i1 %exitcond.not, label %for.cond.cleanup, label %for.body
 | |
| }
 | |
| 
 | |
| ; Loop-carrying callee passed to @compute from @main. Returns %x unchanged when
 | |
| ; %n <= 1 (signed compare). Otherwise the loop runs %n - 1 times, and each
 | |
| ; iteration replaces the running value with its own square; the final squared
 | |
| ; value is returned.
 | |
| define internal i64 @power(i64 %x, i64 %n) {
 | |
| entry:
 | |
|   %cmp6 = icmp sgt i64 %n, 1
 | |
|   br i1 %cmp6, label %for.body, label %for.cond.cleanup
 | |
| 
 | |
| for.cond.cleanup:                                 ; preds = %for.body, %entry
 | |
|   %x.addr.0.lcssa = phi i64 [ %x, %entry ], [ %mul, %for.body ]
 | |
|   ret i64 %x.addr.0.lcssa
 | |
| 
 | |
| for.body:                                         ; preds = %entry, %for.body
 | |
|   %indvars.iv = phi i64 [ %indvars.iv.next, %for.body ], [ 1, %entry ]
 | |
|   %x.addr.07 = phi i64 [ %mul, %for.body ], [ %x, %entry ]
 | |
|   %mul = mul nsw i64 %x.addr.07, %x.addr.07
 | |
|   %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
 | |
|   %exitcond.not = icmp eq i64 %indvars.iv.next, %n
 | |
|   br i1 %exitcond.not, label %for.cond.cleanup, label %for.body
 | |
| }
 |