| // NOTE: Assertions have been autogenerated by utils/update_mc_test_checks.py UTC_ARGS: --version 5 |
| // RUN: llvm-mc -triple=amdgcn -mcpu=gfx1250 -mattr=+real-true16 -show-encoding %s | FileCheck --check-prefix=GFX1250 %s |
| |
| // v_tanh_bf16 in e64 form. Sources covered: VGPRs, SGPRs, vcc/ttmp/m0/exec/null, |
| // the constants -1, 0.5 and src_scc, and 0x8000, which is emitted as a trailing |
| // 32-bit literal. Output modifiers mul:2, mul:4, div:2 and clamp are exercised too. |
| v_tanh_bf16_e64 v5, v1 |
| // GFX1250: v_tanh_bf16_e64 v5, v1 ; encoding: [0x05,0x00,0xca,0xd5,0x01,0x01,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, v255 |
| // GFX1250: v_tanh_bf16_e64 v5, v255 ; encoding: [0x05,0x00,0xca,0xd5,0xff,0x01,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, s1 |
| // GFX1250: v_tanh_bf16_e64 v5, s1 ; encoding: [0x05,0x00,0xca,0xd5,0x01,0x00,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, s105 |
| // GFX1250: v_tanh_bf16_e64 v5, s105 ; encoding: [0x05,0x00,0xca,0xd5,0x69,0x00,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, vcc_lo |
| // GFX1250: v_tanh_bf16_e64 v5, vcc_lo ; encoding: [0x05,0x00,0xca,0xd5,0x6a,0x00,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, vcc_hi |
| // GFX1250: v_tanh_bf16_e64 v5, vcc_hi ; encoding: [0x05,0x00,0xca,0xd5,0x6b,0x00,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, ttmp15 |
| // GFX1250: v_tanh_bf16_e64 v5, ttmp15 ; encoding: [0x05,0x00,0xca,0xd5,0x7b,0x00,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, m0 |
| // GFX1250: v_tanh_bf16_e64 v5, m0 ; encoding: [0x05,0x00,0xca,0xd5,0x7d,0x00,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, exec_lo |
| // GFX1250: v_tanh_bf16_e64 v5, exec_lo ; encoding: [0x05,0x00,0xca,0xd5,0x7e,0x00,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, exec_hi |
| // GFX1250: v_tanh_bf16_e64 v5, exec_hi ; encoding: [0x05,0x00,0xca,0xd5,0x7f,0x00,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, null |
| // GFX1250: v_tanh_bf16_e64 v5, null ; encoding: [0x05,0x00,0xca,0xd5,0x7c,0x00,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, -1 |
| // GFX1250: v_tanh_bf16_e64 v5, -1 ; encoding: [0x05,0x00,0xca,0xd5,0xc1,0x00,0x00,0x00] |
| |
| v_tanh_bf16_e64 v5, 0.5 mul:2 |
| // GFX1250: v_tanh_bf16_e64 v5, 0.5 mul:2 ; encoding: [0x05,0x00,0xca,0xd5,0xf0,0x00,0x00,0x08] |
| |
| v_tanh_bf16_e64 v5, src_scc mul:4 |
| // GFX1250: v_tanh_bf16_e64 v5, src_scc mul:4 ; encoding: [0x05,0x00,0xca,0xd5,0xfd,0x00,0x00,0x10] |
| |
| // Negated absolute value of a literal, with clamp and div:2; the literal adds four bytes. |
| v_tanh_bf16_e64 v255, -|0x8000| clamp div:2 |
| // GFX1250: v_tanh_bf16_e64 v255, -|0x8000| clamp div:2 ; encoding: [0xff,0x81,0xca,0xd5,0xff,0x00,0x00,0x38,0x00,0x80,0x00,0x00] |
| |
| // Suffix-less mnemonic with a .l destination and a .h source of v128; the expected |
| // output is the e64 form with op_sel:[1,0] (0x08 in the second encoding byte). |
| v_tanh_bf16 v5.l, v128.h |
| // GFX1250: v_tanh_bf16_e64 v5.l, v128.h op_sel:[1,0] ; encoding: [0x05,0x08,0xca,0xd5,0x80,0x01,0x00,0x00] |
| |
| // v_cvt_f32_bf8 in e64 form: an SGPR, the constant 3 and a VGPR as source, each |
| // without byte_sel and with byte_sel 1..3. In the expected encodings byte_sel:1 |
| // sets 0x10 and byte_sel:2 sets 0x08 in the second byte (byte_sel:3 sets both). |
| v_cvt_f32_bf8_e64 v1, s3 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, s3 ; encoding: [0x01,0x00,0xed,0xd5,0x03,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, s3 byte_sel:1 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, s3 byte_sel:1 ; encoding: [0x01,0x10,0xed,0xd5,0x03,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, s3 byte_sel:2 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, s3 byte_sel:2 ; encoding: [0x01,0x08,0xed,0xd5,0x03,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, s3 byte_sel:3 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, s3 byte_sel:3 ; encoding: [0x01,0x18,0xed,0xd5,0x03,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, 3 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, 3 ; encoding: [0x01,0x00,0xed,0xd5,0x83,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, 3 byte_sel:1 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, 3 byte_sel:1 ; encoding: [0x01,0x10,0xed,0xd5,0x83,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, 3 byte_sel:2 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, 3 byte_sel:2 ; encoding: [0x01,0x08,0xed,0xd5,0x83,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, 3 byte_sel:3 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, 3 byte_sel:3 ; encoding: [0x01,0x18,0xed,0xd5,0x83,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, v3 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, v3 ; encoding: [0x01,0x00,0xed,0xd5,0x03,0x01,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, v3 byte_sel:1 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, v3 byte_sel:1 ; encoding: [0x01,0x10,0xed,0xd5,0x03,0x01,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, v3 byte_sel:2 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, v3 byte_sel:2 ; encoding: [0x01,0x08,0xed,0xd5,0x03,0x01,0x00,0x00] |
| |
| v_cvt_f32_bf8_e64 v1, v3 byte_sel:3 |
| // GFX1250: v_cvt_f32_bf8_e64 v1, v3 byte_sel:3 ; encoding: [0x01,0x18,0xed,0xd5,0x03,0x01,0x00,0x00] |
| |
| // v_cvt_f32_fp8 in e64 form: an SGPR, the constant 3 and a VGPR as source, each |
| // without byte_sel and with byte_sel 1..3. In the expected encodings byte_sel:1 |
| // sets 0x10 and byte_sel:2 sets 0x08 in the second byte (byte_sel:3 sets both). |
| v_cvt_f32_fp8_e64 v1, s3 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, s3 ; encoding: [0x01,0x00,0xec,0xd5,0x03,0x00,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, s3 byte_sel:1 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, s3 byte_sel:1 ; encoding: [0x01,0x10,0xec,0xd5,0x03,0x00,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, s3 byte_sel:2 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, s3 byte_sel:2 ; encoding: [0x01,0x08,0xec,0xd5,0x03,0x00,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, s3 byte_sel:3 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, s3 byte_sel:3 ; encoding: [0x01,0x18,0xec,0xd5,0x03,0x00,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, 3 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, 3 ; encoding: [0x01,0x00,0xec,0xd5,0x83,0x00,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, 3 byte_sel:1 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, 3 byte_sel:1 ; encoding: [0x01,0x10,0xec,0xd5,0x83,0x00,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, 3 byte_sel:2 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, 3 byte_sel:2 ; encoding: [0x01,0x08,0xec,0xd5,0x83,0x00,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, 3 byte_sel:3 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, 3 byte_sel:3 ; encoding: [0x01,0x18,0xec,0xd5,0x83,0x00,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, v3 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, v3 ; encoding: [0x01,0x00,0xec,0xd5,0x03,0x01,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, v3 byte_sel:1 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, v3 byte_sel:1 ; encoding: [0x01,0x10,0xec,0xd5,0x03,0x01,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, v3 byte_sel:2 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, v3 byte_sel:2 ; encoding: [0x01,0x08,0xec,0xd5,0x03,0x01,0x00,0x00] |
| |
| v_cvt_f32_fp8_e64 v1, v3 byte_sel:3 |
| // GFX1250: v_cvt_f32_fp8_e64 v1, v3 byte_sel:3 ; encoding: [0x01,0x18,0xec,0xd5,0x03,0x01,0x00,0x00] |
| |
| // clamp without byte_sel: only 0x80 is set in the second encoding byte. |
| v_cvt_f32_fp8_e64 v1, v3 clamp |
| // GFX1250: v_cvt_f32_fp8_e64 v1, v3 clamp ; encoding: [0x01,0x80,0xec,0xd5,0x03,0x01,0x00,0x00] |
| |
| // Suffix-less mnemonic with byte_sel plus clamp; the expected output is the e64 |
| // form with both fields set in the second byte (0x90 = 0x80|0x10, 0x88 = 0x80|0x08). |
| v_cvt_f32_fp8 v1, v3 byte_sel:1 clamp |
| // GFX1250: v_cvt_f32_fp8_e64 v1, v3 byte_sel:1 clamp ; encoding: [0x01,0x90,0xec,0xd5,0x03,0x01,0x00,0x00] |
| |
| v_cvt_f32_fp8 v1, v3 byte_sel:2 clamp |
| // GFX1250: v_cvt_f32_fp8_e64 v1, v3 byte_sel:2 clamp ; encoding: [0x01,0x88,0xec,0xd5,0x03,0x01,0x00,0x00] |
| |
| // v_rcp_bf16 in e64 form. Sources covered: VGPRs, SGPRs, vcc/ttmp/m0/exec/null, |
| // the constants -1, 0.5 and src_scc, and 0x8000, which is emitted as a trailing |
| // 32-bit literal. Output modifiers mul:2, mul:4, div:2 and clamp are exercised too. |
| v_rcp_bf16_e64 v5, v1 |
| // GFX1250: v_rcp_bf16_e64 v5, v1 ; encoding: [0x05,0x00,0xf9,0xd5,0x01,0x01,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, v255 |
| // GFX1250: v_rcp_bf16_e64 v5, v255 ; encoding: [0x05,0x00,0xf9,0xd5,0xff,0x01,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, s1 |
| // GFX1250: v_rcp_bf16_e64 v5, s1 ; encoding: [0x05,0x00,0xf9,0xd5,0x01,0x00,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, s105 |
| // GFX1250: v_rcp_bf16_e64 v5, s105 ; encoding: [0x05,0x00,0xf9,0xd5,0x69,0x00,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, vcc_lo |
| // GFX1250: v_rcp_bf16_e64 v5, vcc_lo ; encoding: [0x05,0x00,0xf9,0xd5,0x6a,0x00,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, vcc_hi |
| // GFX1250: v_rcp_bf16_e64 v5, vcc_hi ; encoding: [0x05,0x00,0xf9,0xd5,0x6b,0x00,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, ttmp15 |
| // GFX1250: v_rcp_bf16_e64 v5, ttmp15 ; encoding: [0x05,0x00,0xf9,0xd5,0x7b,0x00,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, m0 |
| // GFX1250: v_rcp_bf16_e64 v5, m0 ; encoding: [0x05,0x00,0xf9,0xd5,0x7d,0x00,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, exec_lo |
| // GFX1250: v_rcp_bf16_e64 v5, exec_lo ; encoding: [0x05,0x00,0xf9,0xd5,0x7e,0x00,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, exec_hi |
| // GFX1250: v_rcp_bf16_e64 v5, exec_hi ; encoding: [0x05,0x00,0xf9,0xd5,0x7f,0x00,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, null |
| // GFX1250: v_rcp_bf16_e64 v5, null ; encoding: [0x05,0x00,0xf9,0xd5,0x7c,0x00,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, -1 |
| // GFX1250: v_rcp_bf16_e64 v5, -1 ; encoding: [0x05,0x00,0xf9,0xd5,0xc1,0x00,0x00,0x00] |
| |
| v_rcp_bf16_e64 v5, 0.5 mul:2 |
| // GFX1250: v_rcp_bf16_e64 v5, 0.5 mul:2 ; encoding: [0x05,0x00,0xf9,0xd5,0xf0,0x00,0x00,0x08] |
| |
| v_rcp_bf16_e64 v5, src_scc mul:4 |
| // GFX1250: v_rcp_bf16_e64 v5, src_scc mul:4 ; encoding: [0x05,0x00,0xf9,0xd5,0xfd,0x00,0x00,0x10] |
| |
| // Negated absolute value of a literal, with clamp and div:2; the literal adds four bytes. |
| v_rcp_bf16_e64 v255, -|0x8000| clamp div:2 |
| // GFX1250: v_rcp_bf16_e64 v255, -|0x8000| clamp div:2 ; encoding: [0xff,0x81,0xf9,0xd5,0xff,0x00,0x00,0x38,0x00,0x80,0x00,0x00] |
| |
| // Suffix-less mnemonic with .h destination and .h source; the expected output is |
| // the e64 form with op_sel:[1,1] (0x48 in the second encoding byte). |
| v_rcp_bf16 v5.h, v128.h |
| // GFX1250: v_rcp_bf16_e64 v5.h, v128.h op_sel:[1,1] ; encoding: [0x05,0x48,0xf9,0xd5,0x80,0x01,0x00,0x00] |
| |
| // v_sqrt_bf16 in e64 form. Sources covered: VGPRs, SGPRs, vcc/ttmp/m0/exec/null, |
| // the constants -1, 0.5 and src_scc, and 0x8000, which is emitted as a trailing |
| // 32-bit literal. Output modifiers mul:2, mul:4, div:2 and clamp are exercised too. |
| v_sqrt_bf16_e64 v5, v1 |
| // GFX1250: v_sqrt_bf16_e64 v5, v1 ; encoding: [0x05,0x00,0xfa,0xd5,0x01,0x01,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, v255 |
| // GFX1250: v_sqrt_bf16_e64 v5, v255 ; encoding: [0x05,0x00,0xfa,0xd5,0xff,0x01,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, s1 |
| // GFX1250: v_sqrt_bf16_e64 v5, s1 ; encoding: [0x05,0x00,0xfa,0xd5,0x01,0x00,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, s105 |
| // GFX1250: v_sqrt_bf16_e64 v5, s105 ; encoding: [0x05,0x00,0xfa,0xd5,0x69,0x00,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, vcc_lo |
| // GFX1250: v_sqrt_bf16_e64 v5, vcc_lo ; encoding: [0x05,0x00,0xfa,0xd5,0x6a,0x00,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, vcc_hi |
| // GFX1250: v_sqrt_bf16_e64 v5, vcc_hi ; encoding: [0x05,0x00,0xfa,0xd5,0x6b,0x00,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, ttmp15 |
| // GFX1250: v_sqrt_bf16_e64 v5, ttmp15 ; encoding: [0x05,0x00,0xfa,0xd5,0x7b,0x00,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, m0 |
| // GFX1250: v_sqrt_bf16_e64 v5, m0 ; encoding: [0x05,0x00,0xfa,0xd5,0x7d,0x00,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, exec_lo |
| // GFX1250: v_sqrt_bf16_e64 v5, exec_lo ; encoding: [0x05,0x00,0xfa,0xd5,0x7e,0x00,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, exec_hi |
| // GFX1250: v_sqrt_bf16_e64 v5, exec_hi ; encoding: [0x05,0x00,0xfa,0xd5,0x7f,0x00,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, null |
| // GFX1250: v_sqrt_bf16_e64 v5, null ; encoding: [0x05,0x00,0xfa,0xd5,0x7c,0x00,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, -1 |
| // GFX1250: v_sqrt_bf16_e64 v5, -1 ; encoding: [0x05,0x00,0xfa,0xd5,0xc1,0x00,0x00,0x00] |
| |
| v_sqrt_bf16_e64 v5, 0.5 mul:2 |
| // GFX1250: v_sqrt_bf16_e64 v5, 0.5 mul:2 ; encoding: [0x05,0x00,0xfa,0xd5,0xf0,0x00,0x00,0x08] |
| |
| v_sqrt_bf16_e64 v5, src_scc mul:4 |
| // GFX1250: v_sqrt_bf16_e64 v5, src_scc mul:4 ; encoding: [0x05,0x00,0xfa,0xd5,0xfd,0x00,0x00,0x10] |
| |
| // Negated absolute value of a literal, with clamp and div:2; the literal adds four bytes. |
| v_sqrt_bf16_e64 v255, -|0x8000| clamp div:2 |
| // GFX1250: v_sqrt_bf16_e64 v255, -|0x8000| clamp div:2 ; encoding: [0xff,0x81,0xfa,0xd5,0xff,0x00,0x00,0x38,0x00,0x80,0x00,0x00] |
| |
| // Suffix-less mnemonic with .h destination and .h source; the expected output is |
| // the e64 form with op_sel:[1,1] (0x48 in the second encoding byte). |
| v_sqrt_bf16 v5.h, v128.h |
| // GFX1250: v_sqrt_bf16_e64 v5.h, v128.h op_sel:[1,1] ; encoding: [0x05,0x48,0xfa,0xd5,0x80,0x01,0x00,0x00] |
| |
| // v_rsq_bf16 in e64 form. Sources covered: VGPRs, SGPRs, vcc/ttmp/m0/exec/null, |
| // the constants -1, 0.5 and src_scc, and 0x8000, which is emitted as a trailing |
| // 32-bit literal. Output modifiers mul:2, mul:4, div:2 and clamp are exercised too. |
| v_rsq_bf16_e64 v5, v1 |
| // GFX1250: v_rsq_bf16_e64 v5, v1 ; encoding: [0x05,0x00,0xfb,0xd5,0x01,0x01,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, v255 |
| // GFX1250: v_rsq_bf16_e64 v5, v255 ; encoding: [0x05,0x00,0xfb,0xd5,0xff,0x01,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, s1 |
| // GFX1250: v_rsq_bf16_e64 v5, s1 ; encoding: [0x05,0x00,0xfb,0xd5,0x01,0x00,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, s105 |
| // GFX1250: v_rsq_bf16_e64 v5, s105 ; encoding: [0x05,0x00,0xfb,0xd5,0x69,0x00,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, vcc_lo |
| // GFX1250: v_rsq_bf16_e64 v5, vcc_lo ; encoding: [0x05,0x00,0xfb,0xd5,0x6a,0x00,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, vcc_hi |
| // GFX1250: v_rsq_bf16_e64 v5, vcc_hi ; encoding: [0x05,0x00,0xfb,0xd5,0x6b,0x00,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, ttmp15 |
| // GFX1250: v_rsq_bf16_e64 v5, ttmp15 ; encoding: [0x05,0x00,0xfb,0xd5,0x7b,0x00,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, m0 |
| // GFX1250: v_rsq_bf16_e64 v5, m0 ; encoding: [0x05,0x00,0xfb,0xd5,0x7d,0x00,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, exec_lo |
| // GFX1250: v_rsq_bf16_e64 v5, exec_lo ; encoding: [0x05,0x00,0xfb,0xd5,0x7e,0x00,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, exec_hi |
| // GFX1250: v_rsq_bf16_e64 v5, exec_hi ; encoding: [0x05,0x00,0xfb,0xd5,0x7f,0x00,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, null |
| // GFX1250: v_rsq_bf16_e64 v5, null ; encoding: [0x05,0x00,0xfb,0xd5,0x7c,0x00,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, -1 |
| // GFX1250: v_rsq_bf16_e64 v5, -1 ; encoding: [0x05,0x00,0xfb,0xd5,0xc1,0x00,0x00,0x00] |
| |
| v_rsq_bf16_e64 v5, 0.5 mul:2 |
| // GFX1250: v_rsq_bf16_e64 v5, 0.5 mul:2 ; encoding: [0x05,0x00,0xfb,0xd5,0xf0,0x00,0x00,0x08] |
| |
| v_rsq_bf16_e64 v5, src_scc mul:4 |
| // GFX1250: v_rsq_bf16_e64 v5, src_scc mul:4 ; encoding: [0x05,0x00,0xfb,0xd5,0xfd,0x00,0x00,0x10] |
| |
| // Negated absolute value of a literal, with clamp and div:2; the literal adds four bytes. |
| v_rsq_bf16_e64 v255, -|0x8000| clamp div:2 |
| // GFX1250: v_rsq_bf16_e64 v255, -|0x8000| clamp div:2 ; encoding: [0xff,0x81,0xfb,0xd5,0xff,0x00,0x00,0x38,0x00,0x80,0x00,0x00] |
| |
| // Suffix-less mnemonic with .h destination and .h source; the expected output is |
| // the e64 form with op_sel:[1,1] (0x48 in the second encoding byte). |
| v_rsq_bf16 v5.h, v128.h |
| // GFX1250: v_rsq_bf16_e64 v5.h, v128.h op_sel:[1,1] ; encoding: [0x05,0x48,0xfb,0xd5,0x80,0x01,0x00,0x00] |
| |
| // v_log_bf16 in e64 form. Sources covered: VGPRs, SGPRs, vcc/ttmp/m0/exec/null, |
| // the constants -1, 0.5 and src_scc, and 0x8000, which is emitted as a trailing |
| // 32-bit literal. Output modifiers mul:2, mul:4, div:2 and clamp are exercised too. |
| v_log_bf16_e64 v5, v1 |
| // GFX1250: v_log_bf16_e64 v5, v1 ; encoding: [0x05,0x00,0xfc,0xd5,0x01,0x01,0x00,0x00] |
| |
| v_log_bf16_e64 v5, v255 |
| // GFX1250: v_log_bf16_e64 v5, v255 ; encoding: [0x05,0x00,0xfc,0xd5,0xff,0x01,0x00,0x00] |
| |
| v_log_bf16_e64 v5, s1 |
| // GFX1250: v_log_bf16_e64 v5, s1 ; encoding: [0x05,0x00,0xfc,0xd5,0x01,0x00,0x00,0x00] |
| |
| v_log_bf16_e64 v5, s105 |
| // GFX1250: v_log_bf16_e64 v5, s105 ; encoding: [0x05,0x00,0xfc,0xd5,0x69,0x00,0x00,0x00] |
| |
| v_log_bf16_e64 v5, vcc_lo |
| // GFX1250: v_log_bf16_e64 v5, vcc_lo ; encoding: [0x05,0x00,0xfc,0xd5,0x6a,0x00,0x00,0x00] |
| |
| v_log_bf16_e64 v5, vcc_hi |
| // GFX1250: v_log_bf16_e64 v5, vcc_hi ; encoding: [0x05,0x00,0xfc,0xd5,0x6b,0x00,0x00,0x00] |
| |
| v_log_bf16_e64 v5, ttmp15 |
| // GFX1250: v_log_bf16_e64 v5, ttmp15 ; encoding: [0x05,0x00,0xfc,0xd5,0x7b,0x00,0x00,0x00] |
| |
| v_log_bf16_e64 v5, m0 |
| // GFX1250: v_log_bf16_e64 v5, m0 ; encoding: [0x05,0x00,0xfc,0xd5,0x7d,0x00,0x00,0x00] |
| |
| v_log_bf16_e64 v5, exec_lo |
| // GFX1250: v_log_bf16_e64 v5, exec_lo ; encoding: [0x05,0x00,0xfc,0xd5,0x7e,0x00,0x00,0x00] |
| |
| v_log_bf16_e64 v5, exec_hi |
| // GFX1250: v_log_bf16_e64 v5, exec_hi ; encoding: [0x05,0x00,0xfc,0xd5,0x7f,0x00,0x00,0x00] |
| |
| v_log_bf16_e64 v5, null |
| // GFX1250: v_log_bf16_e64 v5, null ; encoding: [0x05,0x00,0xfc,0xd5,0x7c,0x00,0x00,0x00] |
| |
| v_log_bf16_e64 v5, -1 |
| // GFX1250: v_log_bf16_e64 v5, -1 ; encoding: [0x05,0x00,0xfc,0xd5,0xc1,0x00,0x00,0x00] |
| |
| v_log_bf16_e64 v5, 0.5 mul:2 |
| // GFX1250: v_log_bf16_e64 v5, 0.5 mul:2 ; encoding: [0x05,0x00,0xfc,0xd5,0xf0,0x00,0x00,0x08] |
| |
| v_log_bf16_e64 v5, src_scc mul:4 |
| // GFX1250: v_log_bf16_e64 v5, src_scc mul:4 ; encoding: [0x05,0x00,0xfc,0xd5,0xfd,0x00,0x00,0x10] |
| |
| // Negated absolute value of a literal, with clamp and div:2; the literal adds four bytes. |
| v_log_bf16_e64 v255, -|0x8000| clamp div:2 |
| // GFX1250: v_log_bf16_e64 v255, -|0x8000| clamp div:2 ; encoding: [0xff,0x81,0xfc,0xd5,0xff,0x00,0x00,0x38,0x00,0x80,0x00,0x00] |
| |
| // Suffix-less mnemonic with .h destination and .h source; the expected output is |
| // the e64 form with op_sel:[1,1] (0x48 in the second encoding byte). |
| v_log_bf16 v5.h, v128.h |
| // GFX1250: v_log_bf16_e64 v5.h, v128.h op_sel:[1,1] ; encoding: [0x05,0x48,0xfc,0xd5,0x80,0x01,0x00,0x00] |
| |
| // v_cvt_f32_bf16 in e64 form. First pass: VGPR, SGPR, vcc/ttmp/m0/exec/null and -1 |
| // sources with no modifiers. |
| v_cvt_f32_bf16_e64 v5, v1 |
| // GFX1250: v_cvt_f32_bf16_e64 v5, v1 ; encoding: [0x05,0x00,0xf2,0xd5,0x01,0x01,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, v255 |
| // GFX1250: v_cvt_f32_bf16_e64 v5, v255 ; encoding: [0x05,0x00,0xf2,0xd5,0xff,0x01,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, s1 |
| // GFX1250: v_cvt_f32_bf16_e64 v5, s1 ; encoding: [0x05,0x00,0xf2,0xd5,0x01,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, s105 |
| // GFX1250: v_cvt_f32_bf16_e64 v5, s105 ; encoding: [0x05,0x00,0xf2,0xd5,0x69,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, vcc_lo |
| // GFX1250: v_cvt_f32_bf16_e64 v5, vcc_lo ; encoding: [0x05,0x00,0xf2,0xd5,0x6a,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, vcc_hi |
| // GFX1250: v_cvt_f32_bf16_e64 v5, vcc_hi ; encoding: [0x05,0x00,0xf2,0xd5,0x6b,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, ttmp15 |
| // GFX1250: v_cvt_f32_bf16_e64 v5, ttmp15 ; encoding: [0x05,0x00,0xf2,0xd5,0x7b,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, m0 |
| // GFX1250: v_cvt_f32_bf16_e64 v5, m0 ; encoding: [0x05,0x00,0xf2,0xd5,0x7d,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, exec_lo |
| // GFX1250: v_cvt_f32_bf16_e64 v5, exec_lo ; encoding: [0x05,0x00,0xf2,0xd5,0x7e,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, exec_hi |
| // GFX1250: v_cvt_f32_bf16_e64 v5, exec_hi ; encoding: [0x05,0x00,0xf2,0xd5,0x7f,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, null |
| // GFX1250: v_cvt_f32_bf16_e64 v5, null ; encoding: [0x05,0x00,0xf2,0xd5,0x7c,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, -1 |
| // GFX1250: v_cvt_f32_bf16_e64 v5, -1 ; encoding: [0x05,0x00,0xf2,0xd5,0xc1,0x00,0x00,0x00] |
| |
| // Second pass: the same kinds of source with op_sel:[1]. The expected output prints |
| // the two-element form op_sel:[1,0] and sets 0x08 in the second encoding byte. |
| v_cvt_f32_bf16_e64 v5, v1 op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, v1 op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x01,0x01,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, v255 op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, v255 op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0xff,0x01,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, s1 op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, s1 op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x01,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, s105 op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, s105 op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x69,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, vcc_lo op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, vcc_lo op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x6a,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, vcc_hi op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, vcc_hi op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x6b,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, ttmp15 op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, ttmp15 op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x7b,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, m0 op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, m0 op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x7d,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, exec_lo op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, exec_lo op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x7e,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, exec_hi op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, exec_hi op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x7f,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, null op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, null op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x7c,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, -1 op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, -1 op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0xc1,0x00,0x00,0x00] |
| |
| v_cvt_f32_bf16_e64 v5, src_scc op_sel:[1] |
| // GFX1250: v_cvt_f32_bf16_e64 v5, src_scc op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0xfd,0x00,0x00,0x00] |
| |
| // A .h source written directly; the expected output adds op_sel:[1,0] and has the |
| // same 0x08 bit as the explicit op_sel:[1] cases. |
| v_cvt_f32_bf16_e64 v5, v128.h |
| // GFX1250: v_cvt_f32_bf16_e64 v5, v128.h op_sel:[1,0] ; encoding: [0x05,0x08,0xf2,0xd5,0x80,0x01,0x00,0x00] |
| |
| // v_cvt_f16_bf8 written without a suffix; every expected output is the e64 form. |
| // Covers a .l destination with VGPR, SGPR, constant 2 and literal 0x1234 sources |
| // (the literal adds four trailing bytes), then byte_sel 1..3. |
| v_cvt_f16_bf8 v150.l, v2 |
| // GFX1250: v_cvt_f16_bf8_e64 v150.l, v2 ; encoding: [0x96,0x00,0xf8,0xd5,0x02,0x01,0x00,0x00] |
| |
| v_cvt_f16_bf8 v150.l, s2 |
| // GFX1250: v_cvt_f16_bf8_e64 v150.l, s2 ; encoding: [0x96,0x00,0xf8,0xd5,0x02,0x00,0x00,0x00] |
| |
| v_cvt_f16_bf8 v150.l, 2 |
| // GFX1250: v_cvt_f16_bf8_e64 v150.l, 2 ; encoding: [0x96,0x00,0xf8,0xd5,0x82,0x00,0x00,0x00] |
| |
| v_cvt_f16_bf8 v150.l, 0x1234 |
| // GFX1250: v_cvt_f16_bf8_e64 v150.l, 0x1234 ; encoding: [0x96,0x00,0xf8,0xd5,0xff,0x00,0x00,0x00,0x34,0x12,0x00,0x00] |
| |
| v_cvt_f16_bf8 v1.l, v2 byte_sel:2 |
| // GFX1250: v_cvt_f16_bf8_e64 v1.l, v2 byte_sel:2 ; encoding: [0x01,0x08,0xf8,0xd5,0x02,0x01,0x00,0x00] |
| |
| v_cvt_f16_bf8 v1.l, v2 byte_sel:1 |
| // GFX1250: v_cvt_f16_bf8_e64 v1.l, v2 byte_sel:1 ; encoding: [0x01,0x10,0xf8,0xd5,0x02,0x01,0x00,0x00] |
| |
| v_cvt_f16_bf8 v1.l, v2 byte_sel:3 |
| // GFX1250: v_cvt_f16_bf8_e64 v1.l, v2 byte_sel:3 ; encoding: [0x01,0x18,0xf8,0xd5,0x02,0x01,0x00,0x00] |
| |
| // A .h destination is expected to print op_sel:[0,1] (0x40 in the second byte); |
| // combined with byte_sel:2 the byte becomes 0x48. |
| v_cvt_f16_bf8 v128.h, v2 |
| // GFX1250: v_cvt_f16_bf8_e64 v128.h, v2 op_sel:[0,1] ; encoding: [0x80,0x40,0xf8,0xd5,0x02,0x01,0x00,0x00] |
| |
| v_cvt_f16_bf8 v1.h, v2 byte_sel:2 |
| // GFX1250: v_cvt_f16_bf8_e64 v1.h, v2 op_sel:[0,1] byte_sel:2 ; encoding: [0x01,0x48,0xf8,0xd5,0x02,0x01,0x00,0x00] |
| |
| // v_cvt_f16_fp8 written without a suffix; every expected output is the e64 form. |
| // Covers a .l destination with VGPR, SGPR, constant 2 and literal 0x1234 sources |
| // (the literal adds four trailing bytes), then byte_sel 1..3. |
| v_cvt_f16_fp8 v150.l, v2 |
| // GFX1250: v_cvt_f16_fp8_e64 v150.l, v2 ; encoding: [0x96,0x00,0xf7,0xd5,0x02,0x01,0x00,0x00] |
| |
| v_cvt_f16_fp8 v150.l, s2 |
| // GFX1250: v_cvt_f16_fp8_e64 v150.l, s2 ; encoding: [0x96,0x00,0xf7,0xd5,0x02,0x00,0x00,0x00] |
| |
| v_cvt_f16_fp8 v150.l, 2 |
| // GFX1250: v_cvt_f16_fp8_e64 v150.l, 2 ; encoding: [0x96,0x00,0xf7,0xd5,0x82,0x00,0x00,0x00] |
| |
| v_cvt_f16_fp8 v150.l, 0x1234 |
| // GFX1250: v_cvt_f16_fp8_e64 v150.l, 0x1234 ; encoding: [0x96,0x00,0xf7,0xd5,0xff,0x00,0x00,0x00,0x34,0x12,0x00,0x00] |
| |
| v_cvt_f16_fp8 v1.l, v2 byte_sel:2 |
| // GFX1250: v_cvt_f16_fp8_e64 v1.l, v2 byte_sel:2 ; encoding: [0x01,0x08,0xf7,0xd5,0x02,0x01,0x00,0x00] |
| |
| v_cvt_f16_fp8 v1.l, v2 byte_sel:1 |
| // GFX1250: v_cvt_f16_fp8_e64 v1.l, v2 byte_sel:1 ; encoding: [0x01,0x10,0xf7,0xd5,0x02,0x01,0x00,0x00] |
| |
| v_cvt_f16_fp8 v1.l, v2 byte_sel:3 |
| // GFX1250: v_cvt_f16_fp8_e64 v1.l, v2 byte_sel:3 ; encoding: [0x01,0x18,0xf7,0xd5,0x02,0x01,0x00,0x00] |
| |
| // A .h destination is expected to print op_sel:[0,1] (0x40 in the second byte); |
| // combined with byte_sel:2 the byte becomes 0x48. |
| v_cvt_f16_fp8 v128.h, v2 |
| // GFX1250: v_cvt_f16_fp8_e64 v128.h, v2 op_sel:[0,1] ; encoding: [0x80,0x40,0xf7,0xd5,0x02,0x01,0x00,0x00] |
| |
| v_cvt_f16_fp8 v1.h, v2 byte_sel:2 |
| // GFX1250: v_cvt_f16_fp8_e64 v1.h, v2 op_sel:[0,1] byte_sel:2 ; encoding: [0x01,0x48,0xf7,0xd5,0x02,0x01,0x00,0x00] |
| |
| // v_cvt_pk_f16_bf8: the expected output keeps the suffix-less mnemonic while the |
| // encoding is eight bytes. op_sel:[1] is expected to print as op_sel:[1,0] and |
| // sets 0x08 in the second encoding byte. |
| v_cvt_pk_f16_bf8 v1, v150 |
| // GFX1250: v_cvt_pk_f16_bf8 v1, v150 ; encoding: [0x01,0x00,0xf6,0xd5,0x96,0x01,0x00,0x00] |
| |
| v_cvt_pk_f16_bf8 v1, v2 op_sel:[1] |
| // GFX1250: v_cvt_pk_f16_bf8 v1, v2 op_sel:[1,0] ; encoding: [0x01,0x08,0xf6,0xd5,0x02,0x01,0x00,0x00] |
| |
| v_cvt_pk_f16_bf8 v1, v150 op_sel:[1] |
| // GFX1250: v_cvt_pk_f16_bf8 v1, v150 op_sel:[1,0] ; encoding: [0x01,0x08,0xf6,0xd5,0x96,0x01,0x00,0x00] |
| |
| v_cvt_pk_f16_bf8 v1, s2 op_sel:[1] |
| // GFX1250: v_cvt_pk_f16_bf8 v1, s2 op_sel:[1,0] ; encoding: [0x01,0x08,0xf6,0xd5,0x02,0x00,0x00,0x00] |
| |
| // v_cvt_pk_f16_fp8: the expected output keeps the suffix-less mnemonic while the |
| // encoding is eight bytes. op_sel:[1] is expected to print as op_sel:[1,0] and |
| // sets 0x08 in the second encoding byte. |
| v_cvt_pk_f16_fp8 v1, v150 |
| // GFX1250: v_cvt_pk_f16_fp8 v1, v150 ; encoding: [0x01,0x00,0xf5,0xd5,0x96,0x01,0x00,0x00] |
| |
| v_cvt_pk_f16_fp8 v1, v2 op_sel:[1] |
| // GFX1250: v_cvt_pk_f16_fp8 v1, v2 op_sel:[1,0] ; encoding: [0x01,0x08,0xf5,0xd5,0x02,0x01,0x00,0x00] |
| |
| v_cvt_pk_f16_fp8 v1, v150 op_sel:[1] |
| // GFX1250: v_cvt_pk_f16_fp8 v1, v150 op_sel:[1,0] ; encoding: [0x01,0x08,0xf5,0xd5,0x96,0x01,0x00,0x00] |
| |
| v_cvt_pk_f16_fp8 v1, s2 op_sel:[1] |
| // GFX1250: v_cvt_pk_f16_fp8 v1, s2 op_sel:[1,0] ; encoding: [0x01,0x08,0xf5,0xd5,0x02,0x00,0x00,0x00] |