| // RUN: mlir-opt %s -split-input-file -test-vector-linearize -verify-diagnostics | FileCheck %s |
| |
| // CHECK-LABEL: test_linearize |
| // CHECK-SAME: (%[[ORIG_ARG:.*]]: vector<2x2xf32>) |
| func.func @test_linearize(%arg0: vector<2x2xf32>) -> vector<2x2xf32> { |
| |
| // CHECK: %[[ARG:.*]] = vector.shape_cast %[[ORIG_ARG]] : vector<2x2xf32> to vector<4xf32> |
| // CHECK: %[[CST:.*]] = arith.constant dense<[1.000000e+00, 2.000000e+00, 3.000000e+00, 4.000000e+00]> : vector<4xf32> |
| // CHECK: %[[RES:.*]] = vector.shape_cast %[[CST]] : vector<4xf32> to vector<2x2xf32> |
| %0 = arith.constant dense<[[1.0, 2.0], [3.0, 4.0]]> : vector<2x2xf32> |
| |
| // CHECK: %{{.*}} = math.sin %[[ARG]] : vector<4xf32> |
| %1 = math.sin %arg0 : vector<2x2xf32> |
| |
| // CHECK: %{{.*}} = arith.addf %[[ARG]], %[[CST]] : vector<4xf32> |
| %2 = arith.addf %arg0, %0 : vector<2x2xf32> |
| |
| // CHECK: return %[[RES]] : vector<2x2xf32> |
| return %0 : vector<2x2xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_linearize_poison |
| func.func @test_linearize_poison() -> vector<2x2xf32> { |
| |
| // CHECK: %[[POISON:.*]] = ub.poison : vector<4xf32> |
| // CHECK: %[[RES:.*]] = vector.shape_cast %[[POISON]] : vector<4xf32> to vector<2x2xf32> |
| %0 = ub.poison : vector<2x2xf32> |
| |
| // CHECK: return %[[RES]] : vector<2x2xf32> |
| return %0 : vector<2x2xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_partial_linearize |
| // CHECK-SAME: (%[[ORIG_ARG:.*]]: vector<2x2xf32>, %[[ORIG_ARG2:.*]]: vector<4x4xf32>) |
| func.func @test_partial_linearize(%arg0: vector<2x2xf32>, %arg1: vector<4x4xf32>) -> vector<2x2xf32> { |
| |
| // CHECK-DAG: %[[ARG:.*]] = vector.shape_cast %[[ORIG_ARG]] : vector<2x2xf32> to vector<4xf32> |
| // CHECK-DAG: %[[ARG2:.*]] = vector.shape_cast %[[ORIG_ARG2]] : vector<4x4xf32> to vector<16xf32> |
| // CHECK: %[[CST:.*]] = arith.constant dense<{{.*}}> : vector<4xf32> |
| // CHECK: %[[RES:.*]] = vector.shape_cast %[[CST]] : vector<4xf32> to vector<2x2xf32> |
| %0 = arith.constant dense<[[1.0, 2.0], [3.0, 4.0]]> : vector<2x2xf32> |
| |
| // CHECK: %[[C2:.*]] = arith.constant dense<{{.*}}> : vector<16xf32> |
| %5 = arith.constant dense<[[1.0, 2.0, 3.0, 4.0], [1.0, 2.0,3.0, 4.0], [1.0, 2.0, 3.0, 4.0], [1.0, 2.0, 5.0, 6.0]]> : vector<4x4xf32> |
| |
| // Arith and math ops are handled in generic way, check some of them |
| // CHECK: %[[SIN:.*]] = math.sin %[[ARG]] : vector<4xf32> |
| %1 = math.sin %arg0 : vector<2x2xf32> |
| |
| // CHECK: %[[SIN1:.*]] = math.sin %[[ARG2]] : vector<16xf32> |
| %6 = math.sin %arg1 : vector<4x4xf32> |
| |
| // CHECK: %{{.*}} = arith.addf %[[ARG]], %[[CST]] : vector<4xf32> |
| %2 = arith.addf %arg0, %0 : vector<2x2xf32> |
| |
| // CHECK: %[[ADD2:.*]] = arith.addf %[[ARG2]], %[[C2]] : vector<16xf32> |
| %7 = arith.addf %arg1, %5 : vector<4x4xf32> |
| |
| // CHECK: return %[[RES]] : vector<2x2xf32> |
| return %0 : vector<2x2xf32> |
| } |
| |
| // ----- |
| |
| // vectorizable operation (arith.mulf) with tensor result types. |
| |
| // CHECK-LABEL: test_tensor_no_linearize |
| func.func @test_tensor_no_linearize(%arg0: tensor<2x2xf32>, %arg1: tensor<2x2xf32>) -> (tensor<2x2xf32>, tensor<2x2xf32>) { |
| |
| // CHECK: %[[MULF:.*]] = arith.mulf %arg0, %arg1 : tensor<2x2xf32> |
| %0 = arith.mulf %arg0, %arg1 : tensor<2x2xf32> |
| |
| return %0, %arg0 : tensor<2x2xf32>, tensor<2x2xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: func.func @test_scalable_linearize( |
| // CHECK-SAME: %[[ARG_0:.*]]: vector<2x[2]xf32>) -> vector<2x[2]xf32> { |
| func.func @test_scalable_linearize(%arg0: vector<2x[2]xf32>) -> vector<2x[2]xf32> { |
| |
| // CHECK: %[[SC:.*]] = vector.shape_cast %[[ARG_0]] : vector<2x[2]xf32> to vector<[4]xf32> |
| // CHECK: %[[CST:.*]] = arith.constant dense<3.000000e+00> : vector<[4]xf32> |
| %0 = arith.constant dense<[[3., 3.], [3., 3.]]> : vector<2x[2]xf32> |
| |
| // CHECK: %[[SIN:.*]] = math.sin %[[SC]] : vector<[4]xf32> |
| %1 = math.sin %arg0 : vector<2x[2]xf32> |
| |
| // CHECK: %[[ADDF:.*]] = arith.addf %[[SIN]], %[[CST]] : vector<[4]xf32> |
| %2 = arith.addf %0, %1 : vector<2x[2]xf32> |
| |
| // CHECK: %[[RES:.*]] = vector.shape_cast %[[ADDF]] : vector<[4]xf32> to vector<2x[2]xf32> |
| // CHECK: return %[[RES]] : vector<2x[2]xf32> |
| return %2 : vector<2x[2]xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: func.func @test_scalable_no_linearize( |
| // CHECK-SAME: %[[VAL_0:.*]]: vector<[2]x[2]xf32>) -> vector<[2]x[2]xf32> { |
| func.func @test_scalable_no_linearize(%arg0: vector<[2]x[2]xf32>) -> vector<[2]x[2]xf32> { |
| |
| // CHECK: %[[CST:.*]] = arith.constant dense<2.000000e+00> : vector<[2]x[2]xf32> |
| %0 = arith.constant dense<[[2., 2.], [2., 2.]]> : vector<[2]x[2]xf32> |
| |
| // CHECK: %[[SIN:.*]] = math.sin %[[VAL_0]] : vector<[2]x[2]xf32> |
| %1 = math.sin %arg0 : vector<[2]x[2]xf32> |
| |
| // CHECK: %[[RES:.*]] = arith.addf %[[CST]], %[[SIN]] : vector<[2]x[2]xf32> |
| %2 = arith.addf %0, %1 : vector<[2]x[2]xf32> |
| |
| // CHECK: return %[[RES]] : vector<[2]x[2]xf32> |
| return %2 : vector<[2]x[2]xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: func.func @test_0d_vector |
| func.func @test_0d_vector() -> vector<f32> { |
| |
| // CHECK: %[[CST:.+]] = arith.constant dense<0.000000e+00> : vector<f32> |
| %0 = arith.constant dense<0.0> : vector<f32> |
| |
| // CHECK: return %[[CST]] |
| return %0 : vector<f32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_extract_strided_slice_2D |
| // CHECK-SAME: (%[[ORIG_ARG:.*]]: vector<4x8xf32>) -> vector<2x2xf32> { |
| func.func @test_extract_strided_slice_2D(%arg0 : vector<4x8xf32>) -> vector<2x2xf32> { |
| |
| // CHECK: %[[ARG:.*]] = vector.shape_cast %[[ORIG_ARG]] : vector<4x8xf32> to vector<32xf32> |
| // CHECK: %[[SHUFFLE:.*]] = vector.shuffle %[[ARG]], %[[ARG]] |
| // CHECK-SAME: [4, 5, 12, 13] : vector<32xf32>, vector<32xf32> |
| // CHECK: %[[RES:.*]] = vector.shape_cast %[[SHUFFLE]] : vector<4xf32> to vector<2x2xf32> |
| // CHECK: return %[[RES]] : vector<2x2xf32 |
| %0 = vector.extract_strided_slice %arg0 { sizes = [2, 2], strides = [1, 1], offsets = [0, 4]} |
| : vector<4x8xf32> to vector<2x2xf32> |
| return %0 : vector<2x2xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: func.func @test_extract_strided_slice_2D_scalable( |
| // CHECK-SAME: %[[VAL_0:.*]]: vector<4x[8]xf32>) -> vector<2x[8]xf32> { |
| func.func @test_extract_strided_slice_2D_scalable(%arg0: vector<4x[8]xf32>) -> vector<2x[8]xf32> { |
| |
| // CHECK-NOT: vector.shuffle |
| // CHECK-NOT: vector.shape_cast |
| // CHECK: %[[RES:.*]] = vector.extract_strided_slice %[[VAL_0]] |
| %0 = vector.extract_strided_slice %arg0 { sizes = [2, 8], strides = [1, 1], offsets = [1, 0] } : vector<4x[8]xf32> to vector<2x[8]xf32> |
| |
| // CHECK: return %[[RES]] : vector<2x[8]xf32> |
| return %0 : vector<2x[8]xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_extract_strided_slice_3D |
| // CHECK-SAME: (%[[ORIG_ARG:.*]]: vector<2x8x2xf32>) -> vector<1x4x2xf32> { |
| func.func @test_extract_strided_slice_3D(%arg0 : vector<2x8x2xf32>) -> vector<1x4x2xf32> { |
| |
| // CHECK: %[[ARG:.*]] = vector.shape_cast %[[ORIG_ARG]] : vector<2x8x2xf32> to vector<32xf32> |
| // CHECK: %[[SHUFFLE:.*]] = vector.shuffle %[[ARG]], %[[ARG]] |
| // CHECK-SAME: [20, 21, 22, 23, 24, 25, 26, 27] : vector<32xf32>, vector<32xf32> |
| // CHECK: %[[RES:.*]] = vector.shape_cast %[[SHUFFLE]] : vector<8xf32> to vector<1x4x2xf32> |
| // CHECK: return %[[RES]] : vector<1x4x2xf32> |
| %0 = vector.extract_strided_slice %arg0 { offsets = [1, 2], strides = [1, 1], sizes = [1, 4] } |
| : vector<2x8x2xf32> to vector<1x4x2xf32> |
| return %0 : vector<1x4x2xf32> |
| } |
| |
| // ----- |
| |
| // Test of insert_strided_slice -> shuffle. |
| // This is a contiguous insertion of 4 elements at offset 6 into a vector of 12 elements. |
| // CHECK-LABEL: insert_strided_slice_2D_into_4D |
| func.func @insert_strided_slice_2D_into_4D(%arg0 : vector<2x2xi8>, %arg1 : vector<2x1x3x2xi8>) -> vector<2x1x3x2xi8> { |
| |
| // CHECK-DAG: %[[ARG0:.*]] = vector.shape_cast {{.*}} to vector<4xi8> |
| // CHECK-DAG: %[[ARG1:.*]] = vector.shape_cast {{.*}} to vector<12xi8> |
| // CHECK: vector.shuffle %[[ARG1]], %[[ARG0]] |
| // CHECK-SAME: [0, 1, 2, 3, 4, 5, 12, 13, 14, 15, 10, 11] : vector<12xi8>, vector<4xi8> |
| %0 = vector.insert_strided_slice %arg0, %arg1 {offsets = [1, 0, 0, 0], strides = [1, 1]} : vector<2x2xi8> into vector<2x1x3x2xi8> |
| |
| // CHECK: %[[RES:.*]] = vector.shape_cast {{.*}} to vector<2x1x3x2xi8> |
| // CHECK: return %[[RES]] : vector<2x1x3x2xi8> |
| return %0 : vector<2x1x3x2xi8> |
| } |
| |
| // ----- |
| |
| // Test of insert_strided_slice -> shuffle. |
| // [[[0, 1], [2, 3], [4, 5]], [[6, 7], [8, 9], [10, 11]], [[12, 13], [14, 15]], [[16, 17]]] |
| // ^ ^ |
| // | | |
| // where the 2 elements are inserted into the 3x3x2 vector |
| // CHECK-LABEL: insert_strided_slice_3D |
| func.func @insert_strided_slice_3D(%arg0 : vector<1x2x1xi8>, %arg1 : vector<3x3x2xi8>) -> vector<3x3x2xi8> { |
| |
| // CHECK-DAG: %[[ARG0:.*]] = vector.shape_cast {{.*}} to vector<2xi8> |
| // CHECK-DAG: %[[ARG1:.*]] = vector.shape_cast {{.*}} to vector<18xi8> |
| // CHECK: vector.shuffle %[[ARG1]], %[[ARG0]] |
| // CHECK-SAME: [0, 1, 2, 3, 4, 5, 6, 7, 8, 18, 10, 19, 12, 13, 14, 15, 16, 17] : vector<18xi8>, vector<2xi8> |
| %0 = vector.insert_strided_slice %arg0, %arg1 {offsets = [1, 1, 1], sizes = [1, 2, 1], strides = [1, 1, 1]} : vector<1x2x1xi8> into vector<3x3x2xi8> |
| |
| // CHECK: %[[RES:.*]] = vector.shape_cast {{.*}} to vector<3x3x2xi8> |
| // CHECK: return %[[RES]] : vector<3x3x2xi8> |
| return %0 : vector<3x3x2xi8> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: insert_strided_slice_2D_higher_offsets |
| func.func @insert_strided_slice_2D_higher_offsets(%arg0 : vector<2x1xi8>, %arg1 : vector<2x2xi8>, %arg2 : vector<5x2xi8>) -> vector<5x2xi8> { |
| |
| // CHECK: [0, 1, 2, 3, 10, 11, 12, 13, 8, 9] |
| // ^^^ ^^^ ^^^ ^^^ |
| // insertion indices |
| %0 = vector.insert_strided_slice %arg1, %arg2 {offsets = [2, 0], sizes = [2, 2], strides = [1, 1]} : vector<2x2xi8> into vector<5x2xi8> |
| |
| // CHECK: [0, 1, 2, 3, 10, 5, 11, 7, 8, 9] |
| // ^^^ ^^^ |
| %1 = vector.insert_strided_slice %arg0, %0 {offsets = [2, 0], sizes = [2, 1], strides = [1, 1]} : vector<2x1xi8> into vector<5x2xi8> |
| |
| // CHECK: [0, 1, 2, 3, 4, 5, 6, 10, 8, 11] |
| // ^^^ ^^^ |
| %2 = vector.insert_strided_slice %arg0, %1 {offsets = [3, 1], sizes = [2, 1], strides = [1, 1]} : vector<2x1xi8> into vector<5x2xi8> |
| |
| return %2 : vector<5x2xi8> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: negative_insert_strided_slice_scalable |
| // CHECK-NOT: vector.shuffle |
| // CHECK: return |
| func.func @negative_insert_strided_slice_scalable(%arg0 : vector<1x[2]xi8>, %arg1 : vector<2x[2]xi8>) -> vector<2x[2]xi8> { |
| %0 = vector.insert_strided_slice %arg0, %arg1 {offsets = [0, 0], strides = [1,1]} : vector<1x[2]xi8> into vector<2x[2]xi8> |
| return %0 : vector<2x[2]xi8> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_vector_shuffle |
| // CHECK-SAME: (%[[ORIG_ARG0:.*]]: vector<4x2xf32>, %[[ORIG_ARG1:.*]]: vector<4x2xf32>) -> vector<8x2xf32> { |
| func.func @test_vector_shuffle(%arg0: vector<4x2xf32>, %arg1: vector<4x2xf32>) -> vector<8x2xf32> { |
| |
| // CHECK-DAG: %[[ARG0:.*]] = vector.shape_cast %[[ORIG_ARG0]] : vector<4x2xf32> to vector<8xf32> |
| // CHECK-DAG: %[[ARG1:.*]] = vector.shape_cast %[[ORIG_ARG1]] : vector<4x2xf32> to vector<8xf32> |
| // CHECK: %[[SHUFFLE:.*]] = vector.shuffle %[[ARG0]], %[[ARG1]] |
| // CHECK-SAME: [0, 1, 8, 9, 2, 3, 10, 11, 4, 5, 12, 13, 6, 7, 14, 15] : vector<8xf32>, vector<8xf32> |
| // CHECK: %[[RES:.*]] = vector.shape_cast %[[SHUFFLE]] : vector<16xf32> to vector<8x2xf32> |
| // CHECK: return %[[RES]] : vector<8x2xf32> |
| %0 = vector.shuffle %arg0, %arg1 [0, 4, 1, 5, 2, 6, 3, 7] : vector<4x2xf32>, vector<4x2xf32> |
| return %0 : vector<8x2xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_vector_extract_scalar |
| // CHECK-SAME: (%[[ARG:.*]]: vector<2x4xi32>) -> i32 { |
| func.func @test_vector_extract_scalar(%arg0 : vector<2x4xi32>) -> i32 { |
| |
| // CHECK: %[[SRC_1D:.*]] = vector.shape_cast %[[ARG]] : vector<2x4xi32> to vector<8xi32> |
| // CHECK: %[[EXTRACT_1D:.*]] = vector.extract %[[SRC_1D]][6] : i32 from vector<8xi32> |
| // CHECK: return %[[EXTRACT_1D]] : i32 |
| %0 = vector.extract %arg0[1, 2] : i32 from vector<2x4xi32> |
| return %0 : i32 |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_vector_extract |
| // CHECK-SAME: (%[[ORIG_ARG:.*]]: vector<2x8x2xf32>) -> vector<8x2xf32> { |
| func.func @test_vector_extract(%arg0: vector<2x8x2xf32>) -> vector<8x2xf32> { |
| |
| // CHECK: %[[ARG:.*]] = vector.shape_cast %[[ORIG_ARG]] : vector<2x8x2xf32> to vector<32xf32> |
| // CHECK: %[[SHUFFLE:.*]] = vector.shuffle %[[ARG]], %[[ARG]] |
| // CHECK-SAME: [16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31] : vector<32xf32>, vector<32xf32> |
| // CHECK: %[[RES:.*]] = vector.shape_cast %[[SHUFFLE]] : vector<16xf32> to vector<8x2xf32> |
| // CHECK: return %[[RES]] : vector<8x2xf32> |
| %0 = vector.extract %arg0[1]: vector<8x2xf32> from vector<2x8x2xf32> |
| return %0 : vector<8x2xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: func.func @test_vector_extract_scalable( |
| // CHECK-SAME: %[[VAL_0:.*]]: vector<2x8x[2]xf32>) -> vector<8x[2]xf32> { |
| func.func @test_vector_extract_scalable(%arg0: vector<2x8x[2]xf32>) -> vector<8x[2]xf32> { |
| |
| // CHECK-NOT: vector.shuffle |
| // CHECK-NOT: vector.shape_cast |
| // CHECK: %[[RES:.*]] = vector.extract %[[VAL_0]][1] : vector<8x[2]xf32> from vector<2x8x[2]xf32> |
| %0 = vector.extract %arg0[1]: vector<8x[2]xf32> from vector<2x8x[2]xf32> |
| |
| // CHECK: return %[[RES]] : vector<8x[2]xf32> |
| return %0 : vector<8x[2]xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_vector_insert_scalar |
| // CHECK-SAME: (%[[DEST:.*]]: vector<2x4xf32>, %[[SRC:.*]]: f32) -> vector<2x4xf32> { |
| func.func @test_vector_insert_scalar(%arg0: vector<2x4xf32>, %arg1: f32) -> vector<2x4xf32> { |
| |
| // CHECK: %[[DEST_1D:.*]] = vector.shape_cast %[[DEST]] : vector<2x4xf32> to vector<8xf32> |
| // CHECK: %[[INSERT_1D:.*]] = vector.insert %[[SRC]], %[[DEST_1D]] [6] : f32 into vector<8xf32> |
| // CHECK: %[[RES:.*]] = vector.shape_cast %[[INSERT_1D]] : vector<8xf32> to vector<2x4xf32> |
| // CHECK: return %[[RES]] : vector<2x4xf32> |
| %0 = vector.insert %arg1, %arg0[1, 2]: f32 into vector<2x4xf32> |
| return %0 : vector<2x4xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_vector_insert |
| // CHECK-SAME: (%[[DEST:.*]]: vector<2x8x4xf32>, %[[SRC:.*]]: vector<8x4xf32>) -> vector<2x8x4xf32> { |
| func.func @test_vector_insert(%arg0: vector<2x8x4xf32>, %arg1: vector<8x4xf32>) -> vector<2x8x4xf32> { |
| |
| // CHECK-DAG: %[[ARG_SRC:.*]] = vector.shape_cast %[[SRC]] : vector<8x4xf32> to vector<32xf32> |
| // CHECK-DAG: %[[ARG_DEST:.*]] = vector.shape_cast %[[DEST]] : vector<2x8x4xf32> to vector<64xf32> |
| // CHECK: %[[SHUFFLE:.*]] = vector.shuffle %[[ARG_DEST]], %[[ARG_SRC]] |
| // CHECK-SAME: [64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, |
| // CHECK-SAME: 88, 89, 90, 91, 92, 93, 94, 95, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, |
| // CHECK-SAME: 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63] : vector<64xf32>, vector<32xf32> |
| // CHECK: %[[RES:.*]] = vector.shape_cast %[[SHUFFLE]] : vector<64xf32> to vector<2x8x4xf32> |
| // CHECK: return %[[RES]] : vector<2x8x4xf32> |
| %0 = vector.insert %arg1, %arg0[0]: vector<8x4xf32> into vector<2x8x4xf32> |
| return %0 : vector<2x8x4xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: func.func @test_vector_insert_scalable( |
| // CHECK-SAME: %[[VAL_0:.*]]: vector<2x8x[4]xf32>, %[[VAL_1:.*]]: vector<8x[4]xf32>) -> vector<2x8x[4]xf32> { |
| func.func @test_vector_insert_scalable(%arg0: vector<2x8x[4]xf32>, %arg1: vector<8x[4]xf32>) -> vector<2x8x[4]xf32> { |
| |
| // CHECK-NOT: vector.shuffle |
| // CHECK-NOT: vector.shape_cast |
| // CHECK: %[[RES:.*]] = vector.insert %[[VAL_1]], %[[VAL_0]] [0] : vector<8x[4]xf32> into vector<2x8x[4]xf32> |
| |
| %0 = vector.insert %arg1, %arg0[0]: vector<8x[4]xf32> into vector<2x8x[4]xf32> |
| // CHECK: return %[[RES]] : vector<2x8x[4]xf32> |
| return %0 : vector<2x8x[4]xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_vector_bitcast |
| // CHECK-SAME: %[[ARG_0:.*]]: vector<4x4xf32> |
| func.func @test_vector_bitcast(%arg0: vector<4x4xf32>) -> vector<4x8xf16> { |
| |
| // CHECK: %[[DOWNCAST:.*]] = vector.shape_cast %[[ARG_0]] : vector<4x4xf32> to vector<16xf32> |
| // CHECK: %[[BITCAST:.*]] = vector.bitcast %[[DOWNCAST]] : vector<16xf32> to vector<32xf16> |
| // CHECK: %[[UPCAST:.*]] = vector.shape_cast %[[BITCAST]] : vector<32xf16> to vector<4x8xf16> |
| %1 = vector.bitcast %arg0 : vector<4x4xf32> to vector<4x8xf16> |
| return %1 : vector<4x8xf16> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_vector_bitcast |
| // CHECK-SAME: %[[ARG_0:.*]]: vector<4x2xf32> |
| func.func @test_vector_bitcast(%arg0: vector<4x2xf32>) -> vector<4x4xf16> { |
| |
| // CHECK: %[[DOWNCAST:.*]] = vector.shape_cast %[[ARG_0]] : vector<4x2xf32> to vector<8xf32> |
| // CHECK: %[[BITCAST:.*]] = vector.bitcast %[[DOWNCAST]] : vector<8xf32> to vector<16xf16> |
| // CHECK: %[[UPCAST:.*]] = vector.shape_cast %[[BITCAST]] : vector<16xf16> to vector<4x4xf16> |
| %1 = vector.bitcast %arg0 : vector<4x2xf32> to vector<4x4xf16> |
| return %1 : vector<4x4xf16> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_vector_bitcast |
| // CHECK-SAME: %[[ARG_0:.*]]: vector<4x[2]xf32> |
| func.func @test_vector_bitcast(%arg0: vector<4x[2]xf32>) -> vector<4x[4]xf16> { |
| |
| // CHECK: %[[DOWNCAST:.*]] = vector.shape_cast %[[ARG_0]] : vector<4x[2]xf32> to vector<[8]xf32> |
| // CHECK: %[[BITCAST:.*]] = vector.bitcast %[[DOWNCAST]] : vector<[8]xf32> to vector<[16]xf16> |
| // CHECK: %[[UPCAST:.*]] = vector.shape_cast %[[BITCAST]] : vector<[16]xf16> to vector<4x[4]xf16> |
| %1 = vector.bitcast %arg0 : vector<4x[2]xf32> to vector<4x[4]xf16> |
| return %1 : vector<4x[4]xf16> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_vector_bitcast |
| // CHECK-SAME: %[[ARG_0:.*]]: vector<[4]x2xf32> |
| func.func @test_vector_bitcast(%arg0: vector<[4]x2xf32>) -> vector<[4]x4xf16> { |
| |
| // CHECK: %[[DOWNCAST:.*]] = vector.shape_cast %[[ARG_0]] : vector<[4]x2xf32> to vector<[8]xf32> |
| // CHECK: %[[BITCAST:.*]] = vector.bitcast %[[DOWNCAST]] : vector<[8]xf32> to vector<[16]xf16> |
| // CHECK: %[[UPCAST:.*]] = vector.shape_cast %[[BITCAST]] : vector<[16]xf16> to vector<[4]x4xf16> |
| %1 = vector.bitcast %arg0 : vector<[4]x2xf32> to vector<[4]x4xf16> |
| return %1 : vector<[4]x4xf16> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: test_linearize_across_for |
| func.func @test_linearize_across_for(%arg0 : vector<4xi8>) -> vector<4xi8> { |
| %0 = vector.shape_cast %arg0 : vector<4xi8> to vector<2x2xi8> |
| %c0 = arith.constant 0 : index |
| %c1 = arith.constant 1 : index |
| %c4 = arith.constant 4 : index |
| |
| // CHECK: scf.for {{.*}} -> (vector<4xi8>) |
| %1 = scf.for %i = %c0 to %c4 step %c1 iter_args(%arg1 = %0) -> (vector<2x2xi8>) { |
| |
| // CHECK: arith.addi {{.*}} : vector<4xi8> |
| %2 = arith.addi %arg1, %0 : vector<2x2xi8> |
| |
| // CHECK: scf.yield {{.*}} : vector<4xi8> |
| scf.yield %2 : vector<2x2xi8> |
| } |
| %3 = vector.shape_cast %1 : vector<2x2xi8> to vector<4xi8> |
| return %3 : vector<4xi8> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: linearize_vector_broadcast_scalar_source |
| // CHECK-SAME: (%[[ARG:.*]]: i32) -> vector<4x2xi32> |
| func.func @linearize_vector_broadcast_scalar_source(%arg0: i32) -> vector<4x2xi32> { |
| |
| // CHECK: %[[BROADCAST:.*]] = vector.broadcast %[[ARG]] : i32 to vector<8xi32> |
| // CHECK: %[[CAST:.*]] = vector.shape_cast %[[BROADCAST]] : vector<8xi32> to vector<4x2xi32> |
| // CHECK: return %[[CAST]] : vector<4x2xi32> |
| %0 = vector.broadcast %arg0 : i32 to vector<4x2xi32> |
| return %0 : vector<4x2xi32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: linearize_vector_broadcast_rank_two_source |
| // CHECK-SAME: (%[[ARG:.*]]: vector<1x1xi32>) -> vector<4x2xi32> |
| func.func @linearize_vector_broadcast_rank_two_source(%arg0: vector<1x1xi32>) -> vector<4x2xi32> { |
| |
| // CHECK: %[[CAST0:.*]] = vector.shape_cast %[[ARG]] : vector<1x1xi32> to vector<1xi32> |
| // CHECK: %[[BROADCAST:.*]] = vector.broadcast %[[CAST0]] : vector<1xi32> to vector<8xi32> |
| // CHECK: %[[CAST1:.*]] = vector.shape_cast %[[BROADCAST]] : vector<8xi32> to vector<4x2xi32> |
| // CHECK: return %[[CAST1]] : vector<4x2xi32> |
| %0 = vector.broadcast %arg0 : vector<1x1xi32> to vector<4x2xi32> |
| return %0 : vector<4x2xi32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: linearize_scalable_vector_broadcast |
| // CHECK-SAME: (%[[ARG:.*]]: i32) -> vector<4x[2]xi32> |
| func.func @linearize_scalable_vector_broadcast(%arg0: i32) -> vector<4x[2]xi32> { |
| |
| // CHECK: %[[BROADCAST:.*]] = vector.broadcast %[[ARG]] : i32 to vector<[8]xi32> |
| // CHECK: %[[CAST:.*]] = vector.shape_cast %[[BROADCAST]] : vector<[8]xi32> to vector<4x[2]xi32> |
| // CHECK: return %[[CAST]] : vector<4x[2]xi32> |
| %0 = vector.broadcast %arg0 : i32 to vector<4x[2]xi32> |
| return %0 : vector<4x[2]xi32> |
| |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: linearize_create_mask |
| // CHECK-SAME: (%[[ARG0:.*]]: index, %[[ARG1:.*]]: index) -> vector<1x16xi1> |
| func.func @linearize_create_mask(%arg0 : index, %arg1 : index) -> vector<1x16xi1> { |
| |
| // CHECK: %[[C0:.*]] = arith.constant 0 : index |
| // CHECK: %[[CMP:.*]] = arith.cmpi sgt, %[[ARG0]], %[[C0]] : index |
| // CHECK: %[[INDEXCAST:.*]] = arith.index_cast %[[CMP]] : i1 to index |
| // CHECK: %[[MULI:.*]] = arith.andi %[[INDEXCAST]], %[[ARG1]] : index |
| // CHECK: %[[MASK_1D:.*]] = vector.create_mask %[[MULI]] : vector<16xi1> |
| // CHECK: %[[CAST:.*]] = vector.shape_cast %[[MASK_1D]] : vector<16xi1> to vector<1x16xi1> |
| // CHECK: return %[[CAST]] : vector<1x16xi1> |
| %0 = vector.create_mask %arg0, %arg1 : vector<1x16xi1> |
| return %0 : vector<1x16xi1> |
| } |
| |
| // ----- |
| // CHECK-LABEL: linearize_scalable_create_mask |
| func.func @linearize_scalable_create_mask(%arg0 : index, %arg1 : index) -> vector<1x[16]xi1> { |
| |
| // CHECK: %[[MASK_1D:.*]] = vector.create_mask {{%.*}} : vector<[16]xi1> |
| %0 = vector.create_mask %arg0, %arg1 : vector<1x[16]xi1> |
| return %0 : vector<1x[16]xi1> |
| } |
| |
| // CHECK-LABEL: linearize_vector_load |
| // CHECK-SAME: (%[[ARG0:.*]]: memref<2x8xf32>) -> vector<1x4xf32> |
| func.func @linearize_vector_load(%arg0: memref<2x8xf32>) -> vector<1x4xf32> { |
| // CHECK: %[[CST0:.*]] = arith.constant 0 : index |
| // CHECK: %[[LOAD:.*]] = vector.load %[[ARG0]][%[[CST0]], %[[CST0]]] : memref<2x8xf32>, vector<4xf32> |
| // CHECK: %[[CAST:.*]] = vector.shape_cast %[[LOAD]] : vector<4xf32> to vector<1x4xf32> |
| // CHECK: return %[[CAST]] : vector<1x4xf32> |
| %c0 = arith.constant 0 : index |
| %0 = vector.load %arg0[%c0, %c0] : memref<2x8xf32>, vector<1x4xf32> |
| return %0 : vector<1x4xf32> |
| } |
| |
| // CHECK-LABEL: linearize_vector_store |
| // CHECK-SAME: (%[[ARG0:.*]]: memref<2x8xf32>, %[[ARG1:.*]]: vector<1x4xf32>) |
| func.func @linearize_vector_store(%arg0: memref<2x8xf32>, %arg1: vector<1x4xf32>) { |
| // CHECK: %[[CAST:.*]] = vector.shape_cast %arg1 : vector<1x4xf32> to vector<4xf32> |
| // CHECK: %[[CST0:.*]] = arith.constant 0 : index |
| // CHECK: vector.store %[[CAST]], %[[ARG0]][%[[CST0]], %[[CST0]]] : memref<2x8xf32>, vector<4xf32> |
| %c0 = arith.constant 0 : index |
| vector.store %arg1, %arg0[%c0, %c0] : memref<2x8xf32>, vector<1x4xf32> |
| return |
| } |
| |
| // CHECK-LABEL: linearize_vector_load_scalable |
| // CHECK-SAME: (%[[ARG0:.*]]: memref<2x8xf32>) -> vector<1x[4]xf32> |
| func.func @linearize_vector_load_scalable(%arg0: memref<2x8xf32>) -> vector<1x[4]xf32> { |
| // CHECK: %[[CST0:.*]] = arith.constant 0 : index |
| // CHECK: %[[LOAD:.*]] = vector.load %[[ARG0]][%[[CST0]], %[[CST0]]] : memref<2x8xf32>, vector<[4]xf32> |
| // CHECK: %[[CAST:.*]] = vector.shape_cast %[[LOAD]] : vector<[4]xf32> to vector<1x[4]xf32> |
| // CHECK: return %[[CAST]] : vector<1x[4]xf32> |
| %c0 = arith.constant 0 : index |
| %0 = vector.load %arg0[%c0, %c0] : memref<2x8xf32>, vector<1x[4]xf32> |
| return %0 : vector<1x[4]xf32> |
| } |
| |
| // CHECK-LABEL: linearize_vector_store_scalable |
| // CHECK-SAME: (%[[ARG0:.*]]: memref<2x8xf32>, %[[ARG1:.*]]: vector<1x[4]xf32>) |
| func.func @linearize_vector_store_scalable(%arg0: memref<2x8xf32>, %arg1: vector<1x[4]xf32>) { |
| // CHECK: %[[CAST:.*]] = vector.shape_cast %arg1 : vector<1x[4]xf32> to vector<[4]xf32> |
| // CHECK: %[[CST0:.*]] = arith.constant 0 : index |
| // CHECK: vector.store %[[CAST]], %[[ARG0]][%[[CST0]], %[[CST0]]] : memref<2x8xf32>, vector<[4]xf32> |
| %c0 = arith.constant 0 : index |
| vector.store %arg1, %arg0[%c0, %c0] : memref<2x8xf32>, vector<1x[4]xf32> |
| return |
| } |
| |
| // ----- |
| |
| // Test pattern LinearizeVectorFromElements. |
| |
| // CHECK-LABEL: test_vector_from_elements |
| // CHECK-SAME: %[[ARG_0:.*]]: f32, %[[ARG_1:.*]]: f32, %[[ARG_2:.*]]: f32, %[[ARG_3:.*]]: f32 |
| func.func @test_vector_from_elements(%arg0: f32, %arg1: f32, %arg2: f32, %arg3: f32) -> vector<2x2xf32> { |
| // CHECK: %[[FROM_ELEMENTS:.*]] = vector.from_elements %[[ARG_0]], %[[ARG_1]], %[[ARG_2]], %[[ARG_3]] : vector<4xf32> |
| // CHECK: %[[CAST:.*]] = vector.shape_cast %[[FROM_ELEMENTS]] : vector<4xf32> to vector<2x2xf32> |
| // CHECK: return %[[CAST]] : vector<2x2xf32> |
| %1 = vector.from_elements %arg0, %arg1, %arg2, %arg3 : vector<2x2xf32> |
| return %1 : vector<2x2xf32> |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: func.func @to_elements_1d( |
| // CHECK-SAME: %[[ARG0:.+]]: vector<2xf32> |
| // CHECK: %[[RES:.+]]:2 = vector.to_elements %[[ARG0]] : vector<2xf32> |
| // CHECK: return %[[RES]]#0, %[[RES]]#1 |
| func.func @to_elements_1d(%arg0: vector<2xf32>) -> (f32, f32) { |
| %0:2 = vector.to_elements %arg0 : vector<2xf32> |
| return %0#0, %0#1 : f32, f32 |
| } |
| |
| // ----- |
| |
| // CHECK-LABEL: func.func @to_elements_2d( |
| // CHECK-SAME: %[[ARG0:.+]]: vector<2x2xf32> |
| // CHECK: %[[CAST:.+]] = vector.shape_cast %[[ARG0]] |
| // CHECK: %[[RES:.+]]:4 = vector.to_elements %[[CAST]] : vector<4xf32> |
| // CHECK: return %[[RES]]#0, %[[RES]]#1, %[[RES]]#2, %[[RES]]#3 |
| func.func @to_elements_2d(%arg0: vector<2x2xf32>) -> (f32, f32, f32, f32) { |
| %0:4 = vector.to_elements %arg0 : vector<2x2xf32> |
| return %0#0, %0#1, %0#2, %0#3 : f32, f32, f32, f32 |
| } |