blob: c9440666d99b50591a392118ce2b55745fb7b161 [file] [log] [blame]
# This test generates all variants of load/store instructions and verifies that
# LLVM generates correct PTX for them.
# RUN: python %s > %t.ll
# RUN: llc < %t.ll -march=nvptx64 -mcpu=sm_30 | FileCheck -check-prefixes=CHECK,CHECK_P64 %t.ll
# RUN: llc < %t.ll -march=nvptx -mcpu=sm_30 | FileCheck -check-prefixes=CHECK,CHECK_P32 %t.ll
from itertools import product
from string import Template
llvm_type_to_ptx_type = {
"i8": "u8",
"i16": "u16",
"i32": "u32",
"i64": "u64",
"half": "b16",
"<2 x half>": "b32",
"float": "f32",
"double": "f64"
}
llvm_type_to_ptx_reg = {
"i8": "r",
"i16": "r",
"i32": "r",
"i64": "rd",
"half": "h",
"<2 x half>": "hh",
"float": "f",
"double": "fd"
}
addrspace_id = {
"": 0,
".global": 1,
".shared": 3,
".const": 4,
".local": 5,
".param": 101
}
def gen_load_tests():
load_template = """
define ${type} @ld${_volatile}${_space}.${ptx_type}(${type} addrspace(${asid})* %ptr) {
; CHECK_P32: ld${_volatile}${_volatile_as}.${ptx_type} %${ptx_reg}{{[0-9]+}}, [%r{{[0-9]+}}]
; CHECK_P64: ld${_volatile}${_volatile_as}.${ptx_type} %${ptx_reg}{{[0-9]+}}, [%rd{{[0-9]+}}]
; CHECK: ret
%p = ${generic_ptr}
%a = load ${volatile} ${type}, ${type}* %p
ret ${type} %a
}
"""
for op_type, volatile, space in product(
["i8", "i16", "i32", "i64", "half", "float", "double", "<2 x half>"],
[True, False], # volatile
["", ".shared", ".global", ".const", ".local", ".param"]):
# Volatile is only supported for global, shared and generic.
if volatile and not space in ["", ".global", ".shared"]:
continue
# Volatile is only supported for global, shared and generic.
# All other volatile accesses are done in generic AS.
if volatile and not space in ["", ".global", ".shared"]:
volatile_as = ""
else:
volatile_as = space
params = {
"type": op_type,
"volatile": "volatile" if volatile else "",
"_volatile": ".volatile" if volatile else "",
"_volatile_as": volatile_as,
"_space": space,
"ptx_reg": llvm_type_to_ptx_reg[op_type],
"ptx_type": llvm_type_to_ptx_type[op_type],
"asid": addrspace_id[space],
}
# LLVM does not accept "addrspacecast Type* addrspace(0) to Type*", so we
# need to avoid it for generic pointer tests.
if space:
generic_ptr_template = ("addrspacecast ${type} addrspace(${asid})* %ptr "
"to ${type}*")
else:
generic_ptr_template = "select i1 true, ${type}* %ptr, ${type}* %ptr"
params["generic_ptr"] = Template(generic_ptr_template).substitute(params)
print(Template(load_template).substitute(params))
def main():
gen_load_tests()
main()