// NOTE: Assertions have been autogenerated by utils/update_mc_test_checks.py UTC_ARGS: --version 5
// RUN: llvm-mc -triple=amdgcn -mcpu=gfx1250 -mattr=-real-true16 -show-encoding %s | FileCheck --check-prefix=GFX1250 %s

// Assembler encoding checks for the gfx1250 target with the real-true16
// feature disabled. Every instruction below is followed by a check line giving
// the exact text and encoding bytes that llvm-mc is expected to print for it.

// v_mov_b64: 64-bit register-pair destination. Sources covered: VGPR pairs,
// an SGPR pair, vcc, exec, null, the inline constants -1 and 0.5, and a
// literal that is printed back as lit64(...) with eight trailing literal bytes.
v_mov_b64_e32 v[4:5], v[2:3]
// GFX1250: v_mov_b64_e32 v[4:5], v[2:3] ; encoding: [0x02,0x3b,0x08,0x7e]

v_mov_b64 v[4:5], v[254:255]
// GFX1250: v_mov_b64_e32 v[4:5], v[254:255] ; encoding: [0xfe,0x3b,0x08,0x7e]

v_mov_b64 v[4:5], s[2:3]
// GFX1250: v_mov_b64_e32 v[4:5], s[2:3] ; encoding: [0x02,0x3a,0x08,0x7e]

v_mov_b64 v[4:5], vcc
// GFX1250: v_mov_b64_e32 v[4:5], vcc ; encoding: [0x6a,0x3a,0x08,0x7e]

v_mov_b64 v[4:5], exec
// GFX1250: v_mov_b64_e32 v[4:5], exec ; encoding: [0x7e,0x3a,0x08,0x7e]

v_mov_b64 v[4:5], null
// GFX1250: v_mov_b64_e32 v[4:5], null ; encoding: [0x7c,0x3a,0x08,0x7e]

v_mov_b64 v[4:5], -1
// GFX1250: v_mov_b64_e32 v[4:5], -1 ; encoding: [0xc1,0x3a,0x08,0x7e]

v_mov_b64 v[4:5], 0.5
// GFX1250: v_mov_b64_e32 v[4:5], 0.5 ; encoding: [0xf0,0x3a,0x08,0x7e]

v_mov_b64 v[254:255], 0xaf123456
// GFX1250: v_mov_b64_e32 v[254:255], lit64(0xaf123456) ; encoding: [0xfe,0x3a,0xfc,0x7f,0x56,0x34,0x12,0xaf,0x00,0x00,0x00,0x00]

// v_tanh_bf16: source-operand sweep over VGPRs, SGPRs, vcc_lo/vcc_hi, ttmp15,
// m0, exec_lo/exec_hi, null, inline constants -1 and 0.5, src_scc, and the
// literal 0x8000 (four trailing literal bytes) with v127 as destination.
v_tanh_bf16 v5, v1
// GFX1250: v_tanh_bf16_e32 v5, v1 ; encoding: [0x01,0x95,0x0a,0x7e]

v_tanh_bf16 v5, v127
// GFX1250: v_tanh_bf16_e32 v5, v127 ; encoding: [0x7f,0x95,0x0a,0x7e]

v_tanh_bf16 v5, s1
// GFX1250: v_tanh_bf16_e32 v5, s1 ; encoding: [0x01,0x94,0x0a,0x7e]

v_tanh_bf16 v5, s105
// GFX1250: v_tanh_bf16_e32 v5, s105 ; encoding: [0x69,0x94,0x0a,0x7e]

v_tanh_bf16 v5, vcc_lo
// GFX1250: v_tanh_bf16_e32 v5, vcc_lo ; encoding: [0x6a,0x94,0x0a,0x7e]

v_tanh_bf16 v5, vcc_hi
// GFX1250: v_tanh_bf16_e32 v5, vcc_hi ; encoding: [0x6b,0x94,0x0a,0x7e]

v_tanh_bf16 v5, ttmp15
// GFX1250: v_tanh_bf16_e32 v5, ttmp15 ; encoding: [0x7b,0x94,0x0a,0x7e]

v_tanh_bf16 v5, m0
// GFX1250: v_tanh_bf16_e32 v5, m0 ; encoding: [0x7d,0x94,0x0a,0x7e]

v_tanh_bf16 v5, exec_lo
// GFX1250: v_tanh_bf16_e32 v5, exec_lo ; encoding: [0x7e,0x94,0x0a,0x7e]

v_tanh_bf16 v5, exec_hi
// GFX1250: v_tanh_bf16_e32 v5, exec_hi ; encoding: [0x7f,0x94,0x0a,0x7e]

v_tanh_bf16 v5, null
// GFX1250: v_tanh_bf16_e32 v5, null ; encoding: [0x7c,0x94,0x0a,0x7e]

v_tanh_bf16 v5, -1
// GFX1250: v_tanh_bf16_e32 v5, -1 ; encoding: [0xc1,0x94,0x0a,0x7e]

v_tanh_bf16 v5, 0.5
// GFX1250: v_tanh_bf16_e32 v5, 0.5 ; encoding: [0xf0,0x94,0x0a,0x7e]

v_tanh_bf16 v5, src_scc
// GFX1250: v_tanh_bf16_e32 v5, src_scc ; encoding: [0xfd,0x94,0x0a,0x7e]

v_tanh_bf16 v127, 0x8000
// GFX1250: v_tanh_bf16_e32 v127, 0x8000 ; encoding: [0xff,0x94,0xfe,0x7e,0x00,0x80,0x00,0x00]

// v_rcp_bf16: same source-operand sweep as the v_tanh_bf16 group.
v_rcp_bf16 v5, v1
// GFX1250: v_rcp_bf16_e32 v5, v1 ; encoding: [0x01,0xf3,0x0a,0x7e]

v_rcp_bf16 v5, v127
// GFX1250: v_rcp_bf16_e32 v5, v127 ; encoding: [0x7f,0xf3,0x0a,0x7e]

v_rcp_bf16 v5, s1
// GFX1250: v_rcp_bf16_e32 v5, s1 ; encoding: [0x01,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, s105
// GFX1250: v_rcp_bf16_e32 v5, s105 ; encoding: [0x69,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, vcc_lo
// GFX1250: v_rcp_bf16_e32 v5, vcc_lo ; encoding: [0x6a,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, vcc_hi
// GFX1250: v_rcp_bf16_e32 v5, vcc_hi ; encoding: [0x6b,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, ttmp15
// GFX1250: v_rcp_bf16_e32 v5, ttmp15 ; encoding: [0x7b,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, m0
// GFX1250: v_rcp_bf16_e32 v5, m0 ; encoding: [0x7d,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, exec_lo
// GFX1250: v_rcp_bf16_e32 v5, exec_lo ; encoding: [0x7e,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, exec_hi
// GFX1250: v_rcp_bf16_e32 v5, exec_hi ; encoding: [0x7f,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, null
// GFX1250: v_rcp_bf16_e32 v5, null ; encoding: [0x7c,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, -1
// GFX1250: v_rcp_bf16_e32 v5, -1 ; encoding: [0xc1,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, 0.5
// GFX1250: v_rcp_bf16_e32 v5, 0.5 ; encoding: [0xf0,0xf2,0x0a,0x7e]

v_rcp_bf16 v5, src_scc
// GFX1250: v_rcp_bf16_e32 v5, src_scc ; encoding: [0xfd,0xf2,0x0a,0x7e]

v_rcp_bf16 v127, 0x8000
// GFX1250: v_rcp_bf16_e32 v127, 0x8000 ; encoding: [0xff,0xf2,0xfe,0x7e,0x00,0x80,0x00,0x00]

// v_sqrt_bf16: same source-operand sweep as the v_tanh_bf16 group.
v_sqrt_bf16 v5, v1
// GFX1250: v_sqrt_bf16_e32 v5, v1 ; encoding: [0x01,0xf5,0x0a,0x7e]

v_sqrt_bf16 v5, v127
// GFX1250: v_sqrt_bf16_e32 v5, v127 ; encoding: [0x7f,0xf5,0x0a,0x7e]

v_sqrt_bf16 v5, s1
// GFX1250: v_sqrt_bf16_e32 v5, s1 ; encoding: [0x01,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, s105
// GFX1250: v_sqrt_bf16_e32 v5, s105 ; encoding: [0x69,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, vcc_lo
// GFX1250: v_sqrt_bf16_e32 v5, vcc_lo ; encoding: [0x6a,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, vcc_hi
// GFX1250: v_sqrt_bf16_e32 v5, vcc_hi ; encoding: [0x6b,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, ttmp15
// GFX1250: v_sqrt_bf16_e32 v5, ttmp15 ; encoding: [0x7b,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, m0
// GFX1250: v_sqrt_bf16_e32 v5, m0 ; encoding: [0x7d,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, exec_lo
// GFX1250: v_sqrt_bf16_e32 v5, exec_lo ; encoding: [0x7e,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, exec_hi
// GFX1250: v_sqrt_bf16_e32 v5, exec_hi ; encoding: [0x7f,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, null
// GFX1250: v_sqrt_bf16_e32 v5, null ; encoding: [0x7c,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, -1
// GFX1250: v_sqrt_bf16_e32 v5, -1 ; encoding: [0xc1,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, 0.5
// GFX1250: v_sqrt_bf16_e32 v5, 0.5 ; encoding: [0xf0,0xf4,0x0a,0x7e]

v_sqrt_bf16 v5, src_scc
// GFX1250: v_sqrt_bf16_e32 v5, src_scc ; encoding: [0xfd,0xf4,0x0a,0x7e]

v_sqrt_bf16 v127, 0x8000
// GFX1250: v_sqrt_bf16_e32 v127, 0x8000 ; encoding: [0xff,0xf4,0xfe,0x7e,0x00,0x80,0x00,0x00]

// v_rsq_bf16: same source-operand sweep as the v_tanh_bf16 group.
v_rsq_bf16 v5, v1
// GFX1250: v_rsq_bf16_e32 v5, v1 ; encoding: [0x01,0xf7,0x0a,0x7e]

v_rsq_bf16 v5, v127
// GFX1250: v_rsq_bf16_e32 v5, v127 ; encoding: [0x7f,0xf7,0x0a,0x7e]

v_rsq_bf16 v5, s1
// GFX1250: v_rsq_bf16_e32 v5, s1 ; encoding: [0x01,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, s105
// GFX1250: v_rsq_bf16_e32 v5, s105 ; encoding: [0x69,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, vcc_lo
// GFX1250: v_rsq_bf16_e32 v5, vcc_lo ; encoding: [0x6a,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, vcc_hi
// GFX1250: v_rsq_bf16_e32 v5, vcc_hi ; encoding: [0x6b,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, ttmp15
// GFX1250: v_rsq_bf16_e32 v5, ttmp15 ; encoding: [0x7b,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, m0
// GFX1250: v_rsq_bf16_e32 v5, m0 ; encoding: [0x7d,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, exec_lo
// GFX1250: v_rsq_bf16_e32 v5, exec_lo ; encoding: [0x7e,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, exec_hi
// GFX1250: v_rsq_bf16_e32 v5, exec_hi ; encoding: [0x7f,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, null
// GFX1250: v_rsq_bf16_e32 v5, null ; encoding: [0x7c,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, -1
// GFX1250: v_rsq_bf16_e32 v5, -1 ; encoding: [0xc1,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, 0.5
// GFX1250: v_rsq_bf16_e32 v5, 0.5 ; encoding: [0xf0,0xf6,0x0a,0x7e]

v_rsq_bf16 v5, src_scc
// GFX1250: v_rsq_bf16_e32 v5, src_scc ; encoding: [0xfd,0xf6,0x0a,0x7e]

v_rsq_bf16 v127, 0x8000
// GFX1250: v_rsq_bf16_e32 v127, 0x8000 ; encoding: [0xff,0xf6,0xfe,0x7e,0x00,0x80,0x00,0x00]

// v_log_bf16: same source-operand sweep as the v_tanh_bf16 group.
v_log_bf16 v5, v1
// GFX1250: v_log_bf16_e32 v5, v1 ; encoding: [0x01,0xf9,0x0a,0x7e]

v_log_bf16 v5, v127
// GFX1250: v_log_bf16_e32 v5, v127 ; encoding: [0x7f,0xf9,0x0a,0x7e]

v_log_bf16 v5, s1
// GFX1250: v_log_bf16_e32 v5, s1 ; encoding: [0x01,0xf8,0x0a,0x7e]

v_log_bf16 v5, s105
// GFX1250: v_log_bf16_e32 v5, s105 ; encoding: [0x69,0xf8,0x0a,0x7e]

v_log_bf16 v5, vcc_lo
// GFX1250: v_log_bf16_e32 v5, vcc_lo ; encoding: [0x6a,0xf8,0x0a,0x7e]

v_log_bf16 v5, vcc_hi
// GFX1250: v_log_bf16_e32 v5, vcc_hi ; encoding: [0x6b,0xf8,0x0a,0x7e]

v_log_bf16 v5, ttmp15
// GFX1250: v_log_bf16_e32 v5, ttmp15 ; encoding: [0x7b,0xf8,0x0a,0x7e]

v_log_bf16 v5, m0
// GFX1250: v_log_bf16_e32 v5, m0 ; encoding: [0x7d,0xf8,0x0a,0x7e]

v_log_bf16 v5, exec_lo
// GFX1250: v_log_bf16_e32 v5, exec_lo ; encoding: [0x7e,0xf8,0x0a,0x7e]

v_log_bf16 v5, exec_hi
// GFX1250: v_log_bf16_e32 v5, exec_hi ; encoding: [0x7f,0xf8,0x0a,0x7e]

v_log_bf16 v5, null
// GFX1250: v_log_bf16_e32 v5, null ; encoding: [0x7c,0xf8,0x0a,0x7e]

v_log_bf16 v5, -1
// GFX1250: v_log_bf16_e32 v5, -1 ; encoding: [0xc1,0xf8,0x0a,0x7e]

v_log_bf16 v5, 0.5
// GFX1250: v_log_bf16_e32 v5, 0.5 ; encoding: [0xf0,0xf8,0x0a,0x7e]

v_log_bf16 v5, src_scc
// GFX1250: v_log_bf16_e32 v5, src_scc ; encoding: [0xfd,0xf8,0x0a,0x7e]

v_log_bf16 v127, 0x8000
// GFX1250: v_log_bf16_e32 v127, 0x8000 ; encoding: [0xff,0xf8,0xfe,0x7e,0x00,0x80,0x00,0x00]

// v_cvt_f32_bf16: same source-operand sweep as the v_tanh_bf16 group.
v_cvt_f32_bf16 v5, v1
// GFX1250: v_cvt_f32_bf16_e32 v5, v1 ; encoding: [0x01,0xe5,0x0a,0x7e]

v_cvt_f32_bf16 v5, v127
// GFX1250: v_cvt_f32_bf16_e32 v5, v127 ; encoding: [0x7f,0xe5,0x0a,0x7e]

v_cvt_f32_bf16 v5, s1
// GFX1250: v_cvt_f32_bf16_e32 v5, s1 ; encoding: [0x01,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, s105
// GFX1250: v_cvt_f32_bf16_e32 v5, s105 ; encoding: [0x69,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, vcc_lo
// GFX1250: v_cvt_f32_bf16_e32 v5, vcc_lo ; encoding: [0x6a,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, vcc_hi
// GFX1250: v_cvt_f32_bf16_e32 v5, vcc_hi ; encoding: [0x6b,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, ttmp15
// GFX1250: v_cvt_f32_bf16_e32 v5, ttmp15 ; encoding: [0x7b,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, m0
// GFX1250: v_cvt_f32_bf16_e32 v5, m0 ; encoding: [0x7d,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, exec_lo
// GFX1250: v_cvt_f32_bf16_e32 v5, exec_lo ; encoding: [0x7e,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, exec_hi
// GFX1250: v_cvt_f32_bf16_e32 v5, exec_hi ; encoding: [0x7f,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, null
// GFX1250: v_cvt_f32_bf16_e32 v5, null ; encoding: [0x7c,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, -1
// GFX1250: v_cvt_f32_bf16_e32 v5, -1 ; encoding: [0xc1,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, 0.5
// GFX1250: v_cvt_f32_bf16_e32 v5, 0.5 ; encoding: [0xf0,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v5, src_scc
// GFX1250: v_cvt_f32_bf16_e32 v5, src_scc ; encoding: [0xfd,0xe4,0x0a,0x7e]

v_cvt_f32_bf16 v127, 0x8000
// GFX1250: v_cvt_f32_bf16_e32 v127, 0x8000 ; encoding: [0xff,0xe4,0xfe,0x7e,0x00,0x80,0x00,0x00]

// v_cvt_f16_bf8 / v_cvt_f16_fp8: VGPR, SGPR, inline constant 2, and the
// literal 0x1234 (four trailing literal bytes) as the source.
v_cvt_f16_bf8 v1, v2
// GFX1250: v_cvt_f16_bf8_e32 v1, v2 ; encoding: [0x02,0xf1,0x02,0x7e]

v_cvt_f16_bf8 v1, s2
// GFX1250: v_cvt_f16_bf8_e32 v1, s2 ; encoding: [0x02,0xf0,0x02,0x7e]

v_cvt_f16_bf8 v1, 2
// GFX1250: v_cvt_f16_bf8_e32 v1, 2 ; encoding: [0x82,0xf0,0x02,0x7e]

v_cvt_f16_bf8 v1, 0x1234
// GFX1250: v_cvt_f16_bf8_e32 v1, 0x1234 ; encoding: [0xff,0xf0,0x02,0x7e,0x34,0x12,0x00,0x00]

v_cvt_f16_fp8 v1, v2
// GFX1250: v_cvt_f16_fp8_e32 v1, v2 ; encoding: [0x02,0xef,0x02,0x7e]

v_cvt_f16_fp8 v1, s2
// GFX1250: v_cvt_f16_fp8_e32 v1, s2 ; encoding: [0x02,0xee,0x02,0x7e]

v_cvt_f16_fp8 v1, 2
// GFX1250: v_cvt_f16_fp8_e32 v1, 2 ; encoding: [0x82,0xee,0x02,0x7e]

v_cvt_f16_fp8 v1, 0x1234
// GFX1250: v_cvt_f16_fp8_e32 v1, 0x1234 ; encoding: [0xff,0xee,0x02,0x7e,0x34,0x12,0x00,0x00]

// v_cvt_pk_f16_bf8 / v_cvt_pk_f16_fp8: VGPR and SGPR sources, plus decimal 100,
// which is expected to be printed back as the literal 0x64. The expected text
// for these two mnemonics carries no _e32 suffix.
v_cvt_pk_f16_bf8 v1, v2
// GFX1250: v_cvt_pk_f16_bf8 v1, v2 ; encoding: [0x02,0xed,0x02,0x7e]

v_cvt_pk_f16_bf8 v1, s2
// GFX1250: v_cvt_pk_f16_bf8 v1, s2 ; encoding: [0x02,0xec,0x02,0x7e]

v_cvt_pk_f16_bf8 v1, 100
// GFX1250: v_cvt_pk_f16_bf8 v1, 0x64 ; encoding: [0xff,0xec,0x02,0x7e,0x64,0x00,0x00,0x00]

v_cvt_pk_f16_fp8 v1, v2
// GFX1250: v_cvt_pk_f16_fp8 v1, v2 ; encoding: [0x02,0xeb,0x02,0x7e]

v_cvt_pk_f16_fp8 v1, s2
// GFX1250: v_cvt_pk_f16_fp8 v1, s2 ; encoding: [0x02,0xea,0x02,0x7e]

v_cvt_pk_f16_fp8 v1, 100
// GFX1250: v_cvt_pk_f16_fp8 v1, 0x64 ; encoding: [0xff,0xea,0x02,0x7e,0x64,0x00,0x00,0x00]

// v_cvt_f32_bf8 / v_cvt_f32_fp8: written with an explicit _e32 suffix in the
// input. Sources covered: SGPR, inline constant 3, and VGPR.
v_cvt_f32_bf8_e32 v1, s3
// GFX1250: v_cvt_f32_bf8_e32 v1, s3 ; encoding: [0x03,0xda,0x02,0x7e]

v_cvt_f32_bf8_e32 v1, 3
// GFX1250: v_cvt_f32_bf8_e32 v1, 3 ; encoding: [0x83,0xda,0x02,0x7e]

v_cvt_f32_bf8_e32 v1, v3
// GFX1250: v_cvt_f32_bf8_e32 v1, v3 ; encoding: [0x03,0xdb,0x02,0x7e]

v_cvt_f32_fp8_e32 v1, s3
// GFX1250: v_cvt_f32_fp8_e32 v1, s3 ; encoding: [0x03,0xd8,0x02,0x7e]

v_cvt_f32_fp8_e32 v1, 3
// GFX1250: v_cvt_f32_fp8_e32 v1, 3 ; encoding: [0x83,0xd8,0x02,0x7e]

v_cvt_f32_fp8_e32 v1, v3
// GFX1250: v_cvt_f32_fp8_e32 v1, v3 ; encoding: [0x03,0xd9,0x02,0x7e]