forked from OSchip/llvm-project
59 lines
3.3 KiB
Plaintext
59 lines
3.3 KiB
Plaintext
// REQUIRES: clang-driver
|
|
// REQUIRES: x86-registered-target
|
|
// REQUIRES: amdgpu-registered-target
|
|
|
|
// RUN: %clang -### -x hip --gpu-max-threads-per-block=1024 %s 2>&1 | FileCheck %s
|
|
|
|
// Check that --gpu-max-threads-per-block=1024 is forwarded to the cc1 command
// that carries -fcuda-is-device (the device-side compilation). Both patterns
// below must match on the same output line.
|
|
//
|
|
// CHECK: clang{{.*}}" "-cc1" {{.*}} "-fcuda-is-device"
|
|
// CHECK-SAME: "--gpu-max-threads-per-block=1024"
|
|
|
|
// -fgpu-allow-device-init must show up on two separate cc1 command lines
// (presumably the device-side and the host-side compilation -- confirm).
// RUN: %clang -### -nogpuinc -nogpulib -fgpu-allow-device-init \
|
|
// RUN: %s 2>&1 | FileCheck -check-prefix=DEVINIT %s
|
|
// DEVINIT: clang{{.*}}" "-cc1" {{.*}}"-fgpu-allow-device-init"
|
|
// DEVINIT: clang{{.*}}" "-cc1" {{.*}}"-fgpu-allow-device-init"
|
|
|
|
// An -mllvm option given once to the driver (here with a Windows MSVC target
// and -fms-extensions) must not be duplicated: the pattern below rejects any
// output where the "-mllvm" "-amdgpu-early-inline-all=true" pair occurs twice
// in a row within one match.
// RUN: %clang -### -x hip -target x86_64-pc-windows-msvc -fms-extensions \
|
|
// RUN: -mllvm -amdgpu-early-inline-all=true %s 2>&1 | \
|
|
// RUN: FileCheck -check-prefix=MLLVM %s
|
|
// MLLVM-NOT: "-mllvm"{{.*}}"-amdgpu-early-inline-all=true"{{.*}}"-mllvm"{{.*}}"-amdgpu-early-inline-all=true"
|
|
|
|
// Options passed through -Xarch_device (-g and -fcf-protection=branch) with
// two GPU architectures requested: expect two -fcuda-is-device command lines
// that each carry a -debug-info-kind= option and -fcf-protection=branch, and
// no clang command line with -debug-info-kind= after them.
// RUN: %clang -### -Xarch_device -g -nogpulib --cuda-gpu-arch=gfx900 \
|
|
// RUN: -Xarch_device -fcf-protection=branch \
|
|
// RUN: --cuda-gpu-arch=gfx906 %s 2>&1 | FileCheck -check-prefix=DEV %s
|
|
// DEV: clang{{.*}} "-fcuda-is-device" {{.*}} "-debug-info-kind={{.*}}" {{.*}} "-fcf-protection=branch"
|
|
// DEV: clang{{.*}} "-fcuda-is-device" {{.*}} "-debug-info-kind={{.*}}" {{.*}} "-fcf-protection=branch"
|
|
// DEV-NOT: clang{{.*}} {{.*}} "-debug-info-kind={{.*}}"
|
|
|
|
// -g passed through -Xarch_host with two GPU architectures requested: no
// -fcuda-is-device command line may carry a -debug-info-kind= option before
// the first clang command line that does carry one.
// RUN: %clang -### -Xarch_host -g -nogpulib --cuda-gpu-arch=gfx900 \
|
|
// RUN: --cuda-gpu-arch=gfx906 %s 2>&1 | FileCheck -check-prefix=HOST %s
|
|
// HOST-NOT: clang{{.*}} "-fcuda-is-device" {{.*}} "-debug-info-kind={{.*}}"
|
|
// HOST-NOT: clang{{.*}} "-fcuda-is-device" {{.*}} "-debug-info-kind={{.*}}"
|
|
// HOST: clang{{.*}} "-debug-info-kind={{.*}}"
|
|
|
|
// -munsafe-fp-atomics given to the driver must be forwarded to the command
// line whose triple is amdgcn-amd-amdhsa.
// RUN: %clang -### -nogpuinc -nogpulib -munsafe-fp-atomics \
|
|
// RUN: --cuda-gpu-arch=gfx906 %s 2>&1 | FileCheck -check-prefix=UNSAFE-FP-ATOMICS %s
|
|
// UNSAFE-FP-ATOMICS: clang{{.*}} "-triple" "amdgcn-amd-amdhsa" {{.*}} "-munsafe-fp-atomics"
|
|
|
|
// Without -munsafe-fp-atomics on the driver command line, the option must not
// appear on any command line whose triple is amdgcn-amd-amdhsa.
// RUN: %clang -### -nogpuinc -nogpulib \
|
|
// RUN: --cuda-gpu-arch=gfx906 %s 2>&1 | FileCheck -check-prefix=DEFAULT-UNSAFE-FP-ATOMICS %s
|
|
// DEFAULT-UNSAFE-FP-ATOMICS-NOT: clang{{.*}} "-triple" "amdgcn-amd-amdhsa" {{.*}} "-munsafe-fp-atomics"
|
|
|
|
// -fgpu-exclude-wrong-side-overloads must reach both the amdgcn-amd-amdhsa
// command line and the x86_64-unknown-linux-gnu command line (in that order),
// each time immediately followed by -fgpu-defer-diag.
// RUN: %clang -### -target x86_64-unknown-linux-gnu -nogpuinc -nogpulib -fgpu-exclude-wrong-side-overloads \
|
|
// RUN: --cuda-gpu-arch=gfx906 %s 2>&1 | FileCheck -check-prefix=FIX-OVERLOAD %s
|
|
// FIX-OVERLOAD: clang{{.*}} "-triple" "amdgcn-amd-amdhsa" {{.*}} "-fgpu-exclude-wrong-side-overloads" "-fgpu-defer-diag"
|
|
// FIX-OVERLOAD: clang{{.*}} "-triple" "x86_64-unknown-linux-gnu" {{.*}} "-fgpu-exclude-wrong-side-overloads" "-fgpu-defer-diag"
|
|
|
|
// Check -mconstructor-aliases is passed to host compilation but is not passed
// to device compilation.
//
// The negative pattern is listed before the positive one on purpose: the
// amdgcn-amd-amdhsa command line is printed ahead of the x86_64 one, and a
// negative FileCheck pattern only scans the output that precedes the next
// positive match. Listed after the host match it would never see the device
// command line and the test could not fail.
|
|
|
|
// RUN: %clang -### -target x86_64-unknown-linux-gnu -nogpuinc -nogpulib \
|
|
// RUN: --cuda-gpu-arch=gfx906 %s 2>&1 | FileCheck -check-prefix=CTA %s
|
|
// CTA-NOT: clang{{.*}} "-triple" "amdgcn-amd-amdhsa" {{.*}} "-mconstructor-aliases"
|
|
// CTA: clang{{.*}} "-triple" "x86_64-unknown-linux-gnu" {{.*}} "-mconstructor-aliases"
|
|
|
|
// -fgpu-inline-threshold=1000 must be turned into "-mllvm"
// "-inline-threshold=1000" on the amdgcn-amd-amdhsa command line, and no
// x86_64-unknown-linux-gnu command line after it may carry
// -inline-threshold=1000.
// RUN: %clang -### -target x86_64-unknown-linux-gnu -nogpuinc -nogpulib \
|
|
// RUN: --offload-arch=gfx906 -fgpu-inline-threshold=1000 %s 2>&1 | FileCheck -check-prefix=THRESH %s
|
|
// THRESH: clang{{.*}} "-triple" "amdgcn-amd-amdhsa" {{.*}} "-mllvm" "-inline-threshold=1000"
|
|
// THRESH-NOT: clang{{.*}} "-triple" "x86_64-unknown-linux-gnu" {{.*}} "-inline-threshold=1000"
|