128 lines
		
	
	
		
			6.5 KiB
		
	
	
	
		
			C
		
	
	
	
			
		
		
	
	
			128 lines
		
	
	
		
			6.5 KiB
		
	
	
	
		
			C
		
	
	
	
| ///
 | |
| /// Perform several driver tests for OpenMP offloading
 | |
| ///
 | |
| 
 | |
| // Until this test is stabilized on all local configurations.
 | |
| // UNSUPPORTED: linux
 | |
| 
 | |
| // REQUIRES: clang-driver
 | |
| // REQUIRES: x86-registered-target
 | |
| // REQUIRES: powerpc-registered-target
 | |
| // REQUIRES: nvptx-registered-target
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check -Xopenmp-target=powerpc64le-ibm-linux-gnu -march=pwr7 is passed when compiling for the device.
 | |
| // RUN:   %clang -### -no-canonical-prefixes -fopenmp=libomp -fopenmp-targets=powerpc64le-ibm-linux-gnu -Xopenmp-target=powerpc64le-ibm-linux-gnu -mcpu=pwr7 %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-FOPENMP-EQ-TARGET %s
 | |
| 
 | |
| // CHK-FOPENMP-EQ-TARGET: clang{{.*}} "-target-cpu" "pwr7"
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check -Xopenmp-target -march=pwr7 is passed when compiling for the device.
 | |
| // RUN:   %clang -### -no-canonical-prefixes -fopenmp=libomp -fopenmp-targets=powerpc64le-ibm-linux-gnu -Xopenmp-target -mcpu=pwr7 %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-FOPENMP-TARGET %s
 | |
| 
 | |
| // CHK-FOPENMP-TARGET: clang{{.*}} "-target-cpu" "pwr7"
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check -Xopenmp-target triggers error when multiple triples are used.
 | |
| // RUN:   %clang -### -no-canonical-prefixes -fopenmp=libomp -fopenmp-targets=powerpc64le-ibm-linux-gnu,powerpc64le-unknown-linux-gnu -Xopenmp-target -mcpu=pwr8 %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-FOPENMP-TARGET-AMBIGUOUS-ERROR %s
 | |
| 
 | |
| // CHK-FOPENMP-TARGET-AMBIGUOUS-ERROR: clang{{.*}} error: cannot deduce implicit triple value for -Xopenmp-target, specify triple using -Xopenmp-target=<triple>
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check -Xopenmp-target triggers error when an option requiring arguments is passed to it.
 | |
| // RUN:   %clang -### -no-canonical-prefixes -fopenmp=libomp -fopenmp-targets=powerpc64le-ibm-linux-gnu -Xopenmp-target -Xopenmp-target -mcpu=pwr8 %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-FOPENMP-TARGET-NESTED-ERROR %s
 | |
| 
 | |
| // CHK-FOPENMP-TARGET-NESTED-ERROR: clang{{.*}} error: invalid -Xopenmp-target argument: '-Xopenmp-target -Xopenmp-target', options requiring arguments are unsupported
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check -Xopenmp-target uses one of the archs provided when several archs are used.
 | |
| // RUN:   %clang -### -no-canonical-prefixes -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda -Xopenmp-target -march=sm_35 -Xopenmp-target -march=sm_60 %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-FOPENMP-TARGET-ARCHS %s
 | |
| 
 | |
| // CHK-FOPENMP-TARGET-ARCHS: ptxas{{.*}}" "--gpu-name" "sm_60"
 | |
| // CHK-FOPENMP-TARGET-ARCHS: nvlink{{.*}}" "-arch" "sm_60"
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check -Xopenmp-target -march=sm_35 works as expected when two triples are present.
 | |
| // RUN:   %clang -### -no-canonical-prefixes -fopenmp=libomp -fopenmp-targets=powerpc64le-ibm-linux-gnu,nvptx64-nvidia-cuda -Xopenmp-target=nvptx64-nvidia-cuda -march=sm_35 %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-FOPENMP-TARGET-COMPILATION %s
 | |
| 
 | |
| // CHK-FOPENMP-TARGET-COMPILATION: ptxas{{.*}}" "--gpu-name" "sm_35"
 | |
| // CHK-FOPENMP-TARGET-COMPILATION: nvlink{{.*}}" "-arch" "sm_35"
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check cubin file generation and usage by nvlink
 | |
| // RUN:   %clang -### -no-canonical-prefixes -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda -save-temps %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-CUBIN %s
 | |
| 
 | |
| // CHK-CUBIN: clang{{.*}}" "-o" "{{.*}}.s"
 | |
| // CHK-CUBIN-NEXT: ptxas{{.*}}" "--output-file" {{.*}}.cubin" {{.*}}.s"
 | |
| // CHK-CUBIN-NEXT: nvlink" {{.*}}.cubin"
 | |
| 
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check cubin file generation and usage by nvlink when toolchain has BindArchAction
 | |
| // RUN:   %clang -### -no-canonical-prefixes -target x86_64-apple-darwin17.0.0 -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-CUBIN-DARWIN %s
 | |
| 
 | |
| // CHK-CUBIN-DARWIN: clang{{.*}}" "-o" "{{.*}}.s"
 | |
| // CHK-CUBIN-DARWIN-NEXT: ptxas{{.*}}" "--output-file" {{.*}}.cubin" {{.*}}.s"
 | |
| // CHK-CUBIN-DARWIN-NEXT: nvlink" {{.*}}.cubin"
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check cubin file generation and usage by nvlink
 | |
| // RUN:   touch %t1.o
 | |
| // RUN:   touch %t2.o
 | |
| // RUN:   %clang -### -no-canonical-prefixes -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda %t1.o %t2.o 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-TWOCUBIN %s
 | |
| 
 | |
| // CHK-TWOCUBIN: nvlink"{{.*}}"openmp-offload-{{.*}}.cubin" "openmp-offload-{{.*}}.cubin"
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check cubin file generation and usage by nvlink when toolchain has BindArchAction
 | |
| // RUN:   touch %t1.o
 | |
| // RUN:   touch %t2.o
 | |
| // RUN:   %clang -### -no-canonical-prefixes -target x86_64-apple-darwin17.0.0 -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda %t1.o %t2.o 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-TWOCUBIN-DARWIN %s
 | |
| 
 | |
| // CHK-TWOCUBIN-DARWIN: nvlink"{{.*}}"openmp-offload-{{.*}}.cubin" "openmp-offload-{{.*}}.cubin"
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// Check PTXAS is passed -c flag when offloading to an NVIDIA device using OpenMP.
 | |
| // RUN:   %clang -### -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda -no-canonical-prefixes %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-PTXAS-DEFAULT %s
 | |
| 
 | |
| // CHK-PTXAS-DEFAULT: ptxas{{.*}}" "-c"
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// PTXAS is passed -c flag by default when offloading to an NVIDIA device using OpenMP - disable it.
 | |
| // RUN:   %clang -### -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda -fnoopenmp-relocatable-target -save-temps -no-canonical-prefixes %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-PTXAS-NORELO %s
 | |
| 
 | |
| // CHK-PTXAS-NORELO-NOT: ptxas{{.*}}" "-c"
 | |
| 
 | |
| /// ###########################################################################
 | |
| 
 | |
| /// PTXAS is passed -c flag by default when offloading to an NVIDIA device using OpenMP
 | |
| /// Check that the flag is passed when -fopenmp-relocatable-target is used.
 | |
| // RUN:   %clang -### -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda -fopenmp-relocatable-target -save-temps -no-canonical-prefixes %s 2>&1 \
 | |
| // RUN:   | FileCheck -check-prefix=CHK-PTXAS-RELO %s
 | |
| 
 | |
| // CHK-PTXAS-RELO: ptxas{{.*}}" "-c"
 |