| // NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py |
| // REQUIRES: amdgpu-registered-target |
| // RUN: %clang_cc1 -cl-std=CL2.0 -triple amdgcn-unknown-unknown -target-cpu gfx1250 -emit-llvm -o - %s | FileCheck %s --check-prefix=CHECK-GFX1250 |
| |
| typedef int v4i __attribute__((ext_vector_type(4))); |
| typedef int v8i __attribute__((ext_vector_type(8))); |
| |
| // CHECK-GFX1250-LABEL: @test_amdgcn_tensor_load_to_lds( |
| // CHECK-GFX1250-NEXT: entry: |
| // CHECK-GFX1250-NEXT: tail call void @llvm.amdgcn.tensor.load.to.lds(<4 x i32> [[SG0:%.*]], <8 x i32> [[SG1:%.*]], <4 x i32> [[SG2:%.*]], <4 x i32> [[SG3:%.*]], i32 0) |
| // CHECK-GFX1250-NEXT: ret void |
| // |
| void test_amdgcn_tensor_load_to_lds(v4i sg0, v8i sg1, v4i sg2, v4i sg3) |
| { |
| __builtin_amdgcn_tensor_load_to_lds(sg0, sg1, sg2, sg3, 0); |
| } |
| |
| // CHECK-GFX1250-LABEL: @test_amdgcn_tensor_load_to_lds_d2( |
| // CHECK-GFX1250-NEXT: entry: |
| // CHECK-GFX1250-NEXT: tail call void @llvm.amdgcn.tensor.load.to.lds.d2(<4 x i32> [[SG0:%.*]], <8 x i32> [[SG1:%.*]], i32 27) |
| // CHECK-GFX1250-NEXT: ret void |
| // |
| void test_amdgcn_tensor_load_to_lds_d2(v4i sg0, v8i sg1) |
| { |
| __builtin_amdgcn_tensor_load_to_lds_d2(sg0, sg1, 27); |
| } |
| |
| // CHECK-GFX1250-LABEL: @test_amdgcn_tensor_store_from_lds( |
| // CHECK-GFX1250-NEXT: entry: |
| // CHECK-GFX1250-NEXT: tail call void @llvm.amdgcn.tensor.store.from.lds(<4 x i32> [[SG0:%.*]], <8 x i32> [[SG1:%.*]], <4 x i32> [[SG2:%.*]], <4 x i32> [[SG3:%.*]], i32 22) |
| // CHECK-GFX1250-NEXT: ret void |
| // |
| void test_amdgcn_tensor_store_from_lds(v4i sg0, v8i sg1, v4i sg2, v4i sg3) |
| { |
| __builtin_amdgcn_tensor_store_from_lds(sg0, sg1, sg2, sg3, 22); |
| } |
| |
| // CHECK-GFX1250-LABEL: @test_amdgcn_tensor_store_from_lds_d2( |
| // CHECK-GFX1250-NEXT: entry: |
| // CHECK-GFX1250-NEXT: tail call void @llvm.amdgcn.tensor.store.from.lds.d2(<4 x i32> [[SG0:%.*]], <8 x i32> [[SG1:%.*]], i32 0) |
| // CHECK-GFX1250-NEXT: ret void |
| // |
| void test_amdgcn_tensor_store_from_lds_d2(v4i sg0, v8i sg1) |
| { |
| __builtin_amdgcn_tensor_store_from_lds_d2(sg0, sg1, 0); |
| } |