blob: 0706882236d86a699d2e83cb577ac0d24669cf1c [file] [log] [blame]
; Test the NVVM reflect pass functionality: verifying that reflect calls are replaced with
; appropriate values based on command-line options. Verify that we can handle custom reflect arguments
; that aren't __CUDA_ARCH or __CUDA_FTZ. If that argument is given a value on the command-line,
; the reflect call should be replaced with that value. Otherwise, the reflect call should be replaced with 0.
; RUN: opt -passes=nvvm-reflect -mtriple=nvptx-nvidia-cuda \
; RUN: -nvvm-reflect-add __CUDA_FTZ=1 -nvvm-reflect-add __CUDA_ARCH=350 %s -S \
; RUN: | FileCheck %s --check-prefixes=COMMON,FTZ1,ARCH350,CUSTOM-ABSENT
; RUN: opt -passes=nvvm-reflect -mtriple=nvptx-nvidia-cuda \
; RUN: -nvvm-reflect-add __CUDA_FTZ=0 -nvvm-reflect-add __CUDA_ARCH=520 %s -S \
; RUN: | FileCheck %s --check-prefixes=COMMON,FTZ0,ARCH520,CUSTOM-ABSENT
; RUN: opt -passes=nvvm-reflect -mtriple=nvptx-nvidia-cuda \
; RUN: -nvvm-reflect-add __CUDA_FTZ=0 -nvvm-reflect-add __CUDA_ARCH=520 \
; RUN: -nvvm-reflect-add __CUSTOM_VALUE=42 %s -S \
; RUN: | FileCheck %s --check-prefixes=COMMON,CUSTOM-PRESENT
; To ensure that command line options override module options, create a copy of this test file
; with module options appended and rerun some tests.
; RUN: cat %s > %t.options
; RUN: echo '!llvm.module.flags = !{!0}' >> %t.options
; RUN: echo '!0 = !{i32 4, !"nvvm-reflect-ftz", i32 1}' >> %t.options
; RUN: opt -passes=nvvm-reflect -mtriple=nvptx-nvidia-cuda \
; RUN: -nvvm-reflect-add __CUDA_FTZ=0 -nvvm-reflect-add __CUDA_ARCH=520 %t.options -S \
; RUN: | FileCheck %s --check-prefixes=COMMON,FTZ0,ARCH520
declare i32 @__nvvm_reflect(ptr)
@ftz = private unnamed_addr addrspace(1) constant [11 x i8] c"__CUDA_FTZ\00"
@arch = private unnamed_addr addrspace(1) constant [12 x i8] c"__CUDA_ARCH\00"
@custom = private unnamed_addr addrspace(1) constant [15 x i8] c"__CUSTOM_VALUE\00"
; COMMON-LABEL: define i32 @test_ftz()
; FTZ1: ret i32 1
; FTZ0: ret i32 0
define i32 @test_ftz() {
%1 = call i32 @__nvvm_reflect(ptr addrspacecast (ptr addrspace(1) @ftz to ptr))
ret i32 %1
}
; COMMON-LABEL: define i32 @test_arch()
; ARCH350: ret i32 350
; ARCH520: ret i32 520
define i32 @test_arch() {
%1 = call i32 @__nvvm_reflect(ptr addrspacecast (ptr addrspace(1) @arch to ptr))
ret i32 %1
}
; COMMON-LABEL: define i32 @test_custom()
; CUSTOM-ABSENT: ret i32 0
; CUSTOM-PRESENT: ret i32 42
define i32 @test_custom() {
%1 = call i32 @__nvvm_reflect(ptr addrspacecast (ptr addrspace(1) @custom to ptr))
ret i32 %1
}