1 | // REQUIRES: clang-driver |
2 | // REQUIRES: x86-registered-target |
3 | // REQUIRES: nvptx-registered-target |
4 | // |
5 | // Check that we properly detect a CUDA installation. |
6 | // RUN: %clang -v --target=i386-unknown-linux \ |
7 | // RUN: --sysroot=%S/no-cuda-there --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NOCUDA |
8 | // RUN: %clang -v --target=i386-apple-macosx \ |
9 | // RUN: --sysroot=%S/no-cuda-there --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NOCUDA |
10 | // RUN: %clang -v --target=x86_64-unknown-linux \ |
11 | // RUN: --sysroot=%S/no-cuda-there --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NOCUDA |
12 | // RUN: %clang -v --target=x86_64-apple-macosx \ |
13 | // RUN: --sysroot=%S/no-cuda-there --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NOCUDA |
14 | |
15 | |
16 | // RUN: %clang -v --target=i386-unknown-linux \ |
17 | // RUN: --sysroot=%S/Inputs/CUDA --cuda-path-ignore-env 2>&1 | FileCheck %s |
18 | // RUN: %clang -v --target=i386-apple-macosx \ |
19 | // RUN: --sysroot=%S/Inputs/CUDA --cuda-path-ignore-env 2>&1 | FileCheck %s |
20 | |
21 | // RUN: %clang -v --target=i386-unknown-linux \ |
22 | // RUN: --cuda-path=%S/Inputs/CUDA/usr/local/cuda 2>&1 | FileCheck %s |
23 | // RUN: %clang -v --target=i386-apple-macosx \ |
24 | // RUN: --cuda-path=%S/Inputs/CUDA/usr/local/cuda 2>&1 | FileCheck %s |
25 | |
26 | // Check that we don't find a CUDA installation without libdevice ... |
27 | // RUN: %clang -v --target=i386-unknown-linux \ |
28 | // RUN: --sysroot=%S/Inputs/CUDA-nolibdevice --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NOCUDA |
29 | // RUN: %clang -v --target=i386-apple-macosx \ |
30 | // RUN: --sysroot=%S/Inputs/CUDA-nolibdevice --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NOCUDA |
31 | // RUN: %clang -v --target=x86_64-unknown-linux \ |
32 | // RUN: --sysroot=%S/Inputs/CUDA-nolibdevice --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NOCUDA |
33 | // RUN: %clang -v --target=x86_64-apple-macosx \ |
34 | // RUN: --sysroot=%S/Inputs/CUDA-nolibdevice --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NOCUDA |
35 | |
36 | // ... unless the user doesn't need libdevice |
37 | // RUN: %clang -v --target=i386-unknown-linux -nocudalib \ |
38 | // RUN: --sysroot=%S/Inputs/CUDA-nolibdevice --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NO-LIBDEVICE |
39 | // RUN: %clang -v --target=i386-apple-macosx -nocudalib \ |
40 | // RUN: --sysroot=%S/Inputs/CUDA-nolibdevice --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NO-LIBDEVICE |
41 | // RUN: %clang -v --target=x86_64-unknown-linux -nocudalib \ |
42 | // RUN: --sysroot=%S/Inputs/CUDA-nolibdevice --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NO-LIBDEVICE |
43 | // RUN: %clang -v --target=x86_64-apple-macosx -nocudalib \ |
44 | // RUN: --sysroot=%S/Inputs/CUDA-nolibdevice --cuda-path-ignore-env 2>&1 | FileCheck %s -check-prefix NO-LIBDEVICE |
45 | |
46 | |
47 | // Make sure we map libdevice bitcode files to proper GPUs. These |
48 | // tests use Inputs/CUDA_80 which has a full set of libdevice files. |
49 | // However, libdevice mapping only matches CUDA-7.x at the moment. |
50 | // sm_2x, sm_32 -> compute_20 |
51 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_21 \ |
52 | // RUN: --cuda-path=%S/Inputs/CUDA_80/usr/local/cuda %s 2>&1 \ |
53 | // RUN: | FileCheck %s -check-prefix COMMON \ |
54 | // RUN: -check-prefix LIBDEVICE -check-prefix LIBDEVICE20 |
55 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_32 \ |
56 | // RUN: --cuda-path=%S/Inputs/CUDA_80/usr/local/cuda %s 2>&1 \ |
57 | // RUN: | FileCheck %s -check-prefix COMMON \ |
58 | // RUN: -check-prefix LIBDEVICE -check-prefix LIBDEVICE20 |
59 | // sm_30, sm_6x map to compute_30. |
60 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_30 \ |
61 | // RUN: --cuda-path=%S/Inputs/CUDA_80/usr/local/cuda %s 2>&1 \ |
62 | // RUN: | FileCheck %s -check-prefix COMMON \ |
63 | // RUN: -check-prefix LIBDEVICE -check-prefix LIBDEVICE30 |
64 | // sm_5x is a special case: it maps to compute_30 for CUDA-7.x only. |
65 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_50 \ |
66 | // RUN: --cuda-path=%S/Inputs/CUDA/usr/local/cuda %s 2>&1 \ |
67 | // RUN: | FileCheck %s -check-prefix COMMON \ |
68 | // RUN: -check-prefix LIBDEVICE -check-prefix LIBDEVICE30 |
69 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_60 \ |
70 | // RUN: --cuda-path=%S/Inputs/CUDA_80/usr/local/cuda %s 2>&1 \ |
71 | // RUN: | FileCheck %s -check-prefix COMMON \ |
72 | // RUN: -check-prefix LIBDEVICE -check-prefix LIBDEVICE30 |
73 | // sm_35 and sm_37 -> compute_35 |
74 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_35 \ |
75 | // RUN: --cuda-path=%S/Inputs/CUDA_80/usr/local/cuda %s 2>&1 \ |
76 | // RUN: | FileCheck %s -check-prefix COMMON -check-prefix CUDAINC \ |
77 | // RUN: -check-prefix LIBDEVICE -check-prefix LIBDEVICE35 |
78 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_37 \ |
79 | // RUN: --cuda-path=%S/Inputs/CUDA_80/usr/local/cuda %s 2>&1 \ |
80 | // RUN: | FileCheck %s -check-prefix COMMON -check-prefix CUDAINC \ |
81 | // RUN: -check-prefix LIBDEVICE -check-prefix LIBDEVICE35 |
82 | // sm_5x -> compute_50 for CUDA-8.0 and newer. |
83 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_50 \ |
84 | // RUN: --cuda-path=%S/Inputs/CUDA_80/usr/local/cuda %s 2>&1 \ |
85 | // RUN: | FileCheck %s -check-prefix COMMON \ |
86 | // RUN: -check-prefix LIBDEVICE -check-prefix LIBDEVICE50 |
87 | |
88 | // Verify that -nocudainc prevents adding include path to CUDA headers. |
89 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_35 \ |
90 | // RUN: -nocudainc --cuda-path=%S/Inputs/CUDA/usr/local/cuda %s 2>&1 \ |
91 | // RUN: | FileCheck %s -check-prefix COMMON -check-prefix NOCUDAINC \ |
92 | // RUN: -check-prefix LIBDEVICE -check-prefix LIBDEVICE35 |
93 | // RUN: %clang -### -v --target=i386-apple-macosx --cuda-gpu-arch=sm_35 \ |
94 | // RUN: -nocudainc --cuda-path=%S/Inputs/CUDA/usr/local/cuda %s 2>&1 \ |
95 | // RUN: | FileCheck %s -check-prefix COMMON -check-prefix NOCUDAINC \ |
96 | // RUN: -check-prefix LIBDEVICE -check-prefix LIBDEVICE35 |
97 | |
98 | // We should not add any CUDA include paths if there's no valid CUDA installation |
99 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_35 \ |
100 | // RUN: --cuda-path=%S/no-cuda-there %s 2>&1 \ |
101 | // RUN: | FileCheck %s -check-prefix COMMON -check-prefix NOCUDAINC |
102 | // RUN: %clang -### -v --target=i386-apple-macosx --cuda-gpu-arch=sm_35 \ |
103 | // RUN: --cuda-path=%S/no-cuda-there %s 2>&1 \ |
104 | // RUN: | FileCheck %s -check-prefix COMMON -check-prefix NOCUDAINC |
105 | |
106 | // Verify that we get an error if there's no libdevice library to link with. |
107 | // NOTE: Inputs/CUDA deliberately does *not* have libdevice.compute_20 for this purpose. |
108 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_20 \ |
109 | // RUN: --cuda-path=%S/Inputs/CUDA/usr/local/cuda %s 2>&1 \ |
110 | // RUN: | FileCheck %s -check-prefix COMMON -check-prefix MISSINGLIBDEVICE |
111 | // RUN: %clang -### -v --target=i386-apple-macosx --cuda-gpu-arch=sm_20 \ |
112 | // RUN: --cuda-path=%S/Inputs/CUDA/usr/local/cuda %s 2>&1 \ |
113 | // RUN: | FileCheck %s -check-prefix COMMON -check-prefix MISSINGLIBDEVICE |
114 | |
115 | // Verify that -nocudalib prevents linking libdevice bitcode in. |
116 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_35 \ |
117 | // RUN: -nocudalib --cuda-path=%S/Inputs/CUDA/usr/local/cuda %s 2>&1 \ |
118 | // RUN: | FileCheck %s -check-prefix COMMON -check-prefix NOLIBDEVICE |
119 | // RUN: %clang -### -v --target=i386-apple-macosx --cuda-gpu-arch=sm_35 \ |
120 | // RUN: -nocudalib --cuda-path=%S/Inputs/CUDA/usr/local/cuda %s 2>&1 \ |
121 | // RUN: | FileCheck %s -check-prefix COMMON -check-prefix NOLIBDEVICE |
122 | |
123 | // Verify that we don't add include paths, link with libdevice or |
124 | // -include __clang_cuda_runtime_wrapper.h without valid CUDA installation. |
125 | // RUN: %clang -### -v --target=i386-unknown-linux --cuda-gpu-arch=sm_35 \ |
126 | // RUN: --cuda-path=%S/no-cuda-there %s 2>&1 \ |
127 | // RUN: | FileCheck %s -check-prefix COMMON \ |
128 | // RUN: -check-prefix NOCUDAINC -check-prefix NOLIBDEVICE |
129 | // RUN: %clang -### -v --target=i386-apple-macosx --cuda-gpu-arch=sm_35 \ |
130 | // RUN: --cuda-path=%S/no-cuda-there %s 2>&1 \ |
131 | // RUN: | FileCheck %s -check-prefix COMMON \ |
132 | // RUN: -check-prefix NOCUDAINC -check-prefix NOLIBDEVICE |
133 | |
134 | // Verify that C++ include paths are passed for both host and device frontends. |
135 | // RUN: %clang -### -no-canonical-prefixes -target x86_64-linux-gnu %s \ |
136 | // RUN: --stdlib=libstdc++ --sysroot=%S/Inputs/ubuntu_14.04_multiarch_tree2 \ |
137 | // RUN: --gcc-toolchain="" 2>&1 \ |
138 | // RUN: | FileCheck %s --check-prefix CHECK-CXXINCLUDE |
139 | |
140 | // Verify that CUDA SDK version is propagated to the CC1 compilations. |
141 | // RUN: %clang -### -v -target x86_64-linux-gnu --cuda-gpu-arch=sm_50 \ |
142 | // RUN: --cuda-path=%S/Inputs/CUDA_80/usr/local/cuda %s 2>&1 \ |
143 | // RUN: | FileCheck %s -check-prefix CUDA80 |
144 | |
145 | // Verify that if no version file is found, we report the default of 7.0. |
146 | // RUN: %clang -### -v -target x86_64-linux-gnu --cuda-gpu-arch=sm_50 \ |
147 | // RUN: --cuda-path=%S/Inputs/CUDA/usr/local/cuda %s 2>&1 \ |
148 | // RUN: | FileCheck %s -check-prefix CUDA70 |
149 | |
150 | // CHECK: Found CUDA installation: {{.*}}/Inputs/CUDA/usr/local/cuda |
151 | // NO-LIBDEVICE: Found CUDA installation: {{.*}}/Inputs/CUDA-nolibdevice/usr/local/cuda |
152 | // NOCUDA-NOT: Found CUDA installation: |
153 | |
154 | // MISSINGLIBDEVICE: error: cannot find libdevice for sm_20. |
155 | |
156 | // COMMON: "-triple" "nvptx-nvidia-cuda" |
157 | // COMMON-SAME: "-fcuda-is-device" |
158 | // LIBDEVICE-SAME: "-mlink-builtin-bitcode" |
159 | // NOLIBDEVICE-NOT: "-mlink-builtin-bitcode" |
160 | // LIBDEVICE20-SAME: libdevice.compute_20.10.bc |
161 | // LIBDEVICE30-SAME: libdevice.compute_30.10.bc |
162 | // LIBDEVICE35-SAME: libdevice.compute_35.10.bc |
163 | // LIBDEVICE50-SAME: libdevice.compute_50.10.bc |
164 | // NOLIBDEVICE-NOT: libdevice.compute_{{.*}}.bc |
165 | // LIBDEVICE-SAME: "-target-feature" "+ptx42" |
166 | // NOLIBDEVICE-NOT: "-target-feature" "+ptx42" |
167 | // CUDAINC-SAME: "-internal-isystem" "{{.*}}/Inputs/CUDA{{[_0-9]+}}/usr/local/cuda/include" |
168 | // NOCUDAINC-NOT: "-internal-isystem" "{{.*}}/cuda/include" |
169 | // CUDAINC-SAME: "-include" "__clang_cuda_runtime_wrapper.h" |
170 | // NOCUDAINC-NOT: "-include" "__clang_cuda_runtime_wrapper.h" |
171 | // -internal-externc-isystem flags must come *after* the cuda include flags, |
172 | // because we must search the cuda include directory first. |
173 | // CUDAINC-SAME: "-internal-externc-isystem" |
174 | // COMMON-SAME: "-x" "cuda" |
175 | // CHECK-CXXINCLUDE: clang{{.*}} "-cc1" "-triple" "nvptx64-nvidia-cuda" |
176 | // CHECK-CXXINCLUDE-SAME: {{.*}}"-internal-isystem" "{{.+}}/include/c++/4.8" |
177 | // CHECK-CXXINCLUDE: clang{{.*}} "-cc1" "-triple" "x86_64-unknown-linux-gnu" |
178 | // CHECK-CXXINCLUDE-SAME: {{.*}}"-internal-isystem" "{{.+}}/include/c++/4.8" |
179 | // CHECK-CXXINCLUDE: ld{{.*}}" |
180 | |
181 | // CUDA80: "-cc1" "-triple" "nvptx64-nvidia-cuda" |
182 | // CUDA80-SAME: -target-sdk-version=8.0 |
183 | // CUDA80: "-cc1" "-triple" "x86_64-unknown-linux-gnu" |
184 | // CUDA80-SAME: -target-sdk-version=8.0 |
185 | // CUDA80: ld{{.*}}" |
186 | |
187 | // CUDA70: "-cc1" "-triple" "nvptx64-nvidia-cuda" |
188 | // CUDA70-SAME: -target-sdk-version=7.0 |
189 | // CUDA70: "-cc1" "-triple" "x86_64-unknown-linux-gnu" |
190 | // CUDA70-SAME: -target-sdk-version=7.0 |
191 | // CUDA70: ld{{.*}}" |
192 | |