|  | ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4 | 
|  | ; RUN: llc -mtriple=aarch64 %s -o - | FileCheck %s --check-prefixes=CHECK,CHECK-SD | 
|  | ; RUN: llc -mtriple=aarch64 -global-isel %s -o - | FileCheck %s --check-prefixes=CHECK,CHECK-GI | 
|  |  | 
|  | ; ====== Scalar Tests ===== | 
|  |  | 
|  | ; ====== Scalar bswap.i16 Tests ===== | 
|  | define i16 @bswap_i16_to_i16_anyext(i16 %a){ | 
|  | ; CHECK-SD-LABEL: bswap_i16_to_i16_anyext: | 
|  | ; CHECK-SD:       // %bb.0: | 
|  | ; CHECK-SD-NEXT:    rev16 w0, w0 | 
|  | ; CHECK-SD-NEXT:    ret | 
|  | ; | 
|  | ; CHECK-GI-LABEL: bswap_i16_to_i16_anyext: | 
|  | ; CHECK-GI:       // %bb.0: | 
|  | ; CHECK-GI-NEXT:    rev w8, w0 | 
|  | ; CHECK-GI-NEXT:    lsr w0, w8, #16 | 
|  | ; CHECK-GI-NEXT:    ret | 
|  | %3 = call i16 @llvm.bswap.i16(i16 %a) | 
|  | ret i16 %3 | 
|  | } | 
|  | declare i16 @llvm.bswap.i16(i16) | 
|  |  | 
|  | ; The zext here is optimised to an any_extend during isel. | 
|  | define i64 @bswap_i16_to_i64_anyext(i16 %a) { | 
|  | ; CHECK-SD-LABEL: bswap_i16_to_i64_anyext: | 
|  | ; CHECK-SD:       // %bb.0: | 
|  | ; CHECK-SD-NEXT:    // kill: def $w0 killed $w0 def $x0 | 
|  | ; CHECK-SD-NEXT:    rev16 x8, x0 | 
|  | ; CHECK-SD-NEXT:    lsl x0, x8, #48 | 
|  | ; CHECK-SD-NEXT:    ret | 
|  | ; | 
|  | ; CHECK-GI-LABEL: bswap_i16_to_i64_anyext: | 
|  | ; CHECK-GI:       // %bb.0: | 
|  | ; CHECK-GI-NEXT:    rev w8, w0 | 
|  | ; CHECK-GI-NEXT:    lsr w8, w8, #16 | 
|  | ; CHECK-GI-NEXT:    and x8, x8, #0xffff | 
|  | ; CHECK-GI-NEXT:    lsl x0, x8, #48 | 
|  | ; CHECK-GI-NEXT:    ret | 
|  | %3 = call i16 @llvm.bswap.i16(i16 %a) | 
|  | %4 = zext i16 %3 to i64 | 
|  | %5 = shl i64 %4, 48 | 
|  | ret i64 %5 | 
|  | } | 
|  |  | 
|  | ; The zext here is optimised to an any_extend during isel.. | 
|  | define i128 @bswap_i16_to_i128_anyext(i16 %a) { | 
|  | ; CHECK-SD-LABEL: bswap_i16_to_i128_anyext: | 
|  | ; CHECK-SD:       // %bb.0: | 
|  | ; CHECK-SD-NEXT:    mov w8, w0 | 
|  | ; CHECK-SD-NEXT:    mov x0, xzr | 
|  | ; CHECK-SD-NEXT:    rev w8, w8 | 
|  | ; CHECK-SD-NEXT:    lsr w8, w8, #16 | 
|  | ; CHECK-SD-NEXT:    lsl x1, x8, #48 | 
|  | ; CHECK-SD-NEXT:    ret | 
|  | ; | 
|  | ; CHECK-GI-LABEL: bswap_i16_to_i128_anyext: | 
|  | ; CHECK-GI:       // %bb.0: | 
|  | ; CHECK-GI-NEXT:    mov w8, w0 | 
|  | ; CHECK-GI-NEXT:    mov x0, xzr | 
|  | ; CHECK-GI-NEXT:    rev w8, w8 | 
|  | ; CHECK-GI-NEXT:    lsr w8, w8, #16 | 
|  | ; CHECK-GI-NEXT:    and x8, x8, #0xffff | 
|  | ; CHECK-GI-NEXT:    lsl x1, x8, #48 | 
|  | ; CHECK-GI-NEXT:    ret | 
|  | %3 = call i16 @llvm.bswap.i16(i16 %a) | 
|  | %4 = zext i16 %3 to i128 | 
|  | %5 = shl i128 %4, 112 | 
|  | ret i128 %5 | 
|  | } | 
|  |  | 
|  | define i32 @bswap_i16_to_i32_zext(i16 %a){ | 
|  | ; CHECK-LABEL: bswap_i16_to_i32_zext: | 
|  | ; CHECK:       // %bb.0: | 
|  | ; CHECK-NEXT:    rev w8, w0 | 
|  | ; CHECK-NEXT:    lsr w0, w8, #16 | 
|  | ; CHECK-NEXT:    ret | 
|  | %3 = call i16 @llvm.bswap.i16(i16 %a) | 
|  | %4 = zext i16 %3 to i32 | 
|  | ret i32 %4 | 
|  | } | 
|  |  | 
|  | ; ====== Other scalar bswap tests ===== | 
|  | define i32 @bswap_i32(i32 %a){ | 
|  | ; CHECK-LABEL: bswap_i32: | 
|  | ; CHECK:       // %bb.0: | 
|  | ; CHECK-NEXT:    rev w0, w0 | 
|  | ; CHECK-NEXT:    ret | 
|  | %3 = call i32 @llvm.bswap.i32(i32 %a) | 
|  | ret i32 %3 | 
|  | } | 
|  | declare i32 @llvm.bswap.i32(i32) | 
|  |  | 
|  | define i64 @bswap_i64(i64 %a){ | 
|  | ; CHECK-LABEL: bswap_i64: | 
|  | ; CHECK:       // %bb.0: | 
|  | ; CHECK-NEXT:    rev x0, x0 | 
|  | ; CHECK-NEXT:    ret | 
|  | %3 = call i64 @llvm.bswap.i64(i64 %a) | 
|  | ret i64 %3 | 
|  | } | 
|  | declare i64 @llvm.bswap.i64(i64) | 
|  |  | 
|  | define i128 @bswap_i128(i128 %a){ | 
|  | ; CHECK-LABEL: bswap_i128: | 
|  | ; CHECK:       // %bb.0: | 
|  | ; CHECK-NEXT:    rev x8, x1 | 
|  | ; CHECK-NEXT:    rev x1, x0 | 
|  | ; CHECK-NEXT:    mov x0, x8 | 
|  | ; CHECK-NEXT:    ret | 
|  | %3 = call i128 @llvm.bswap.i128(i128 %a) | 
|  | ret i128 %3 | 
|  | } | 
|  | declare i128 @llvm.bswap.i128(i128) | 
|  |  | 
|  | ; ===== Legal Vector Type Tests ===== | 
|  |  | 
|  | define <4 x i16> @bswap_v4i16(<4 x i16> %a){ | 
|  | ; CHECK-LABEL: bswap_v4i16: | 
|  | ; CHECK:       // %bb.0: | 
|  | ; CHECK-NEXT:    rev16 v0.8b, v0.8b | 
|  | ; CHECK-NEXT:    ret | 
|  | %3 = call <4 x i16> @llvm.bswap.v4i16(<4 x i16> %a) | 
|  | ret <4 x i16> %3 | 
|  | } | 
|  | declare <4 x i16> @llvm.bswap.v4i16(<4 x i16>) | 
|  |  | 
|  | define <8 x i16> @bswap_v8i16(<8 x i16> %a){ | 
|  | ; CHECK-LABEL: bswap_v8i16: | 
|  | ; CHECK:       // %bb.0: | 
|  | ; CHECK-NEXT:    rev16 v0.16b, v0.16b | 
|  | ; CHECK-NEXT:    ret | 
|  | %3 = call <8 x i16> @llvm.bswap.v8i16(<8 x i16> %a) | 
|  | ret <8 x i16> %3 | 
|  | } | 
|  | declare <8 x i16> @llvm.bswap.v8i16(<8 x i16>) | 
|  |  | 
|  | define <2 x i32> @bswap_v2i32(<2 x i32> %a){ | 
|  | ; CHECK-LABEL: bswap_v2i32: | 
|  | ; CHECK:       // %bb.0: | 
|  | ; CHECK-NEXT:    rev32 v0.8b, v0.8b | 
|  | ; CHECK-NEXT:    ret | 
|  | %3 = call <2 x i32> @llvm.bswap.v2i32(<2 x i32> %a) | 
|  | ret <2 x i32> %3 | 
|  | } | 
|  | declare <2 x i32> @llvm.bswap.v2i32(<2 x i32>) | 
|  |  | 
|  | define <4 x i32> @bswap_v4i32(<4 x i32> %a){ | 
|  | ; CHECK-LABEL: bswap_v4i32: | 
|  | ; CHECK:       // %bb.0: | 
|  | ; CHECK-NEXT:    rev32 v0.16b, v0.16b | 
|  | ; CHECK-NEXT:    ret | 
|  | %3 = call <4 x i32> @llvm.bswap.v4i32(<4 x i32> %a) | 
|  | ret <4 x i32> %3 | 
|  | } | 
|  | declare <4 x i32> @llvm.bswap.v4i32(<4 x i32>) | 
|  |  | 
|  | define <2 x i64> @bswap_v2i64(<2 x i64> %a){ | 
|  | ; CHECK-LABEL: bswap_v2i64: | 
|  | ; CHECK:       // %bb.0: | 
|  | ; CHECK-NEXT:    rev64 v0.16b, v0.16b | 
|  | ; CHECK-NEXT:    ret | 
|  | %3 = call <2 x i64> @llvm.bswap.v2i64(<2 x i64> %a) | 
|  | ret <2 x i64> %3 | 
|  | } | 
|  | declare <2 x i64> @llvm.bswap.v2i64(<2 x i64>) | 
|  |  | 
|  | ; ===== Smaller/Larger Width Vectors with Legal Element Sizes ===== | 
|  |  | 
|  | define <2 x i16> @bswap_v2i16(<2 x i16> %a){ | 
|  | ; CHECK-SD-LABEL: bswap_v2i16: | 
|  | ; CHECK-SD:       // %bb.0: // %entry | 
|  | ; CHECK-SD-NEXT:    rev32 v0.8b, v0.8b | 
|  | ; CHECK-SD-NEXT:    ushr v0.2s, v0.2s, #16 | 
|  | ; CHECK-SD-NEXT:    ret | 
|  | ; | 
|  | ; CHECK-GI-LABEL: bswap_v2i16: | 
|  | ; CHECK-GI:       // %bb.0: // %entry | 
|  | ; CHECK-GI-NEXT:    uzp1 v0.4h, v0.4h, v0.4h | 
|  | ; CHECK-GI-NEXT:    rev16 v0.8b, v0.8b | 
|  | ; CHECK-GI-NEXT:    ushll v0.4s, v0.4h, #0 | 
|  | ; CHECK-GI-NEXT:    // kill: def $d0 killed $d0 killed $q0 | 
|  | ; CHECK-GI-NEXT:    ret | 
|  | entry: | 
|  | %res = call <2 x i16> @llvm.bswap.v2i16(<2 x i16> %a) | 
|  | ret <2 x i16> %res | 
|  | } | 
|  | declare <2 x i16> @llvm.bswap.v2i16(<2 x i16>) | 
|  |  | 
|  | define <16 x i16> @bswap_v16i16(<16 x i16> %a){ | 
|  | ; CHECK-LABEL: bswap_v16i16: | 
|  | ; CHECK:       // %bb.0: // %entry | 
|  | ; CHECK-NEXT:    rev16 v0.16b, v0.16b | 
|  | ; CHECK-NEXT:    rev16 v1.16b, v1.16b | 
|  | ; CHECK-NEXT:    ret | 
|  | entry: | 
|  | %res = call <16 x i16> @llvm.bswap.v16i16(<16 x i16> %a) | 
|  | ret <16 x i16> %res | 
|  | } | 
|  | declare <16 x i16> @llvm.bswap.v16i16(<16 x i16>) | 
|  |  | 
|  | define <1 x i32> @bswap_v1i32(<1 x i32> %a){ | 
|  | ; CHECK-SD-LABEL: bswap_v1i32: | 
|  | ; CHECK-SD:       // %bb.0: // %entry | 
|  | ; CHECK-SD-NEXT:    rev32 v0.8b, v0.8b | 
|  | ; CHECK-SD-NEXT:    ret | 
|  | ; | 
|  | ; CHECK-GI-LABEL: bswap_v1i32: | 
|  | ; CHECK-GI:       // %bb.0: // %entry | 
|  | ; CHECK-GI-NEXT:    fmov w8, s0 | 
|  | ; CHECK-GI-NEXT:    rev w8, w8 | 
|  | ; CHECK-GI-NEXT:    mov v0.s[0], w8 | 
|  | ; CHECK-GI-NEXT:    // kill: def $d0 killed $d0 killed $q0 | 
|  | ; CHECK-GI-NEXT:    ret | 
|  | entry: | 
|  | %res = call <1 x i32> @llvm.bswap.v1i32(<1 x i32> %a) | 
|  | ret <1 x i32> %res | 
|  | } | 
|  | declare <1 x i32> @llvm.bswap.v1i32(<1 x i32>) | 
|  |  | 
|  | define <8 x i32> @bswap_v8i32(<8 x i32> %a){ | 
|  | ; CHECK-LABEL: bswap_v8i32: | 
|  | ; CHECK:       // %bb.0: // %entry | 
|  | ; CHECK-NEXT:    rev32 v0.16b, v0.16b | 
|  | ; CHECK-NEXT:    rev32 v1.16b, v1.16b | 
|  | ; CHECK-NEXT:    ret | 
|  | entry: | 
|  | %res = call <8 x i32> @llvm.bswap.v8i32(<8 x i32> %a) | 
|  | ret <8 x i32> %res | 
|  | } | 
|  | declare <8 x i32> @llvm.bswap.v8i32(<8 x i32>) | 
|  |  | 
|  | define <4 x i64> @bswap_v4i64(<4 x i64> %a){ | 
|  | ; CHECK-LABEL: bswap_v4i64: | 
|  | ; CHECK:       // %bb.0: // %entry | 
|  | ; CHECK-NEXT:    rev64 v0.16b, v0.16b | 
|  | ; CHECK-NEXT:    rev64 v1.16b, v1.16b | 
|  | ; CHECK-NEXT:    ret | 
|  | entry: | 
|  | %res = call <4 x i64> @llvm.bswap.v4i64(<4 x i64> %a) | 
|  | ret <4 x i64> %res | 
|  | } | 
|  | declare <4 x i64> @llvm.bswap.v4i64(<4 x i64>) | 
|  |  | 
|  | ; ===== Vectors with Non-Pow 2 Widths ===== | 
|  |  | 
|  | define <3 x i16> @bswap_v3i16(<3 x i16> %a){ | 
|  | ; CHECK-LABEL: bswap_v3i16: | 
|  | ; CHECK:       // %bb.0: // %entry | 
|  | ; CHECK-NEXT:    rev16 v0.8b, v0.8b | 
|  | ; CHECK-NEXT:    ret | 
|  | entry: | 
|  | %res = call <3 x i16> @llvm.bswap.v3i16(<3 x i16> %a) | 
|  | ret <3 x i16> %res | 
|  | } | 
|  | declare <3 x i16> @llvm.bswap.v3i16(<3 x i16>) | 
|  |  | 
|  | define <7 x i16> @bswap_v7i16(<7 x i16> %a){ | 
|  | ; CHECK-LABEL: bswap_v7i16: | 
|  | ; CHECK:       // %bb.0: // %entry | 
|  | ; CHECK-NEXT:    rev16 v0.16b, v0.16b | 
|  | ; CHECK-NEXT:    ret | 
|  | entry: | 
|  | %res = call <7 x i16> @llvm.bswap.v7i16(<7 x i16> %a) | 
|  | ret <7 x i16> %res | 
|  | } | 
|  | declare <7 x i16> @llvm.bswap.v7i16(<7 x i16>) | 
|  |  | 
|  | define <3 x i32> @bswap_v3i32(<3 x i32> %a){ | 
|  | ; CHECK-LABEL: bswap_v3i32: | 
|  | ; CHECK:       // %bb.0: // %entry | 
|  | ; CHECK-NEXT:    rev32 v0.16b, v0.16b | 
|  | ; CHECK-NEXT:    ret | 
|  | entry: | 
|  | %res = call <3 x i32> @llvm.bswap.v3i32(<3 x i32> %a) | 
|  | ret <3 x i32> %res | 
|  | } | 
|  | declare <3 x i32> @llvm.bswap.v3i32(<3 x i32>) |