From 37bf3bb49d2f63e65e040f13271efb344fd96144 Mon Sep 17 00:00:00 2001 From: MITSUNARI Shigeo Date: Thu, 9 Sep 2021 10:53:20 +0900 Subject: [PATCH] add vscalefsh --- gen/gen_avx512.cpp | 1 + test/misc.cpp | 6 ++++++ xbyak/xbyak_mnemonic.h | 1 + 3 files changed, 8 insertions(+) diff --git a/gen/gen_avx512.cpp b/gen/gen_avx512.cpp index edc0571..cd223ae 100644 --- a/gen/gen_avx512.cpp +++ b/gen/gen_avx512.cpp @@ -348,6 +348,7 @@ void putX_X_XM_IMM() { 0x2D, "vscalefss", T_66 | T_0F38 | T_MUST_EVEX | T_EW0 | T_ER_X | T_N4, false }, { 0x2C, "vscalefph", T_66 | T_MAP6 | T_YMM | T_MUST_EVEX | T_EW0 | T_B16 | T_ER_Z, false }, + { 0x2D, "vscalefsh", T_66 | T_MAP6 | T_MUST_EVEX | T_EW0 | T_ER_X | T_N2, false }, { 0x42, "vdbpsadbw", T_66 | T_0F3A | T_YMM | T_MUST_EVEX | T_EW0, true }, { 0x83, "vpmultishiftqb", T_66 | T_0F38 | T_YMM | T_MUST_EVEX | T_EW1 | T_B64, false }, diff --git a/test/misc.cpp b/test/misc.cpp index 665af2a..98dc8c5 100644 --- a/test/misc.cpp +++ b/test/misc.cpp @@ -1003,6 +1003,8 @@ CYBOZU_TEST_AUTO(vaddph) vscalefph(zmm1, zmm5, ptr_b [rax+0x40]); vscalefph(zmm1|k1|T_z|T_rd_sae, zmm5, zmm7); + vscalefsh(xmm1, xmm5, ptr [rax+0x40]); + vscalefsh(xmm1|k1|T_z|T_rd_sae, xmm5, xmm7); @@ -1170,6 +1172,10 @@ CYBOZU_TEST_AUTO(vaddph) 0x62, 0xf6, 0x55, 0x48, 0x2c, 0x48, 0x01, 0x62, 0xf6, 0x55, 0x58, 0x2c, 0x48, 0x20, 0x62, 0xf6, 0x55, 0xb9, 0x2c, 0xcf, + + // vscalefsh + 0x62, 0xf6, 0x55, 0x08, 0x2d, 0x48, 0x20, + 0x62, 0xf6, 0x55, 0xb9, 0x2d, 0xcf, }; const size_t n = sizeof(tbl) / sizeof(tbl[0]); CYBOZU_TEST_EQUAL(c.getSize(), n); diff --git a/xbyak/xbyak_mnemonic.h b/xbyak/xbyak_mnemonic.h index a94a1a5..a9966ae 100644 --- a/xbyak/xbyak_mnemonic.h +++ b/xbyak/xbyak_mnemonic.h @@ -2207,6 +2207,7 @@ void vscalefpd(const Xmm& x1, const Xmm& x2, const Operand& op) { opAVX_X_X_XM(x void vscalefph(const Xmm& x1, const Xmm& x2, const Operand& op) { opAVX_X_X_XM(x1, x2, op, T_66 | T_MAP6 | T_EW0 | T_YMM | T_ER_Z | T_MUST_EVEX | T_B16, 0x2C); } void vscalefps(const Xmm& x1, const Xmm& x2, const Operand& op) { opAVX_X_X_XM(x1, x2, op, T_66 | T_0F38 | T_EW0 | T_YMM | T_ER_Z | T_MUST_EVEX | T_B32, 0x2C); } void vscalefsd(const Xmm& x1, const Xmm& x2, const Operand& op) { opAVX_X_X_XM(x1, x2, op, T_N8 | T_66 | T_0F38 | T_EW1 | T_ER_X | T_MUST_EVEX, 0x2D); } +void vscalefsh(const Xmm& x1, const Xmm& x2, const Operand& op) { opAVX_X_X_XM(x1, x2, op, T_N2 | T_66 | T_MAP6 | T_EW0 | T_ER_X | T_MUST_EVEX, 0x2D); } void vscalefss(const Xmm& x1, const Xmm& x2, const Operand& op) { opAVX_X_X_XM(x1, x2, op, T_N4 | T_66 | T_0F38 | T_EW0 | T_ER_X | T_MUST_EVEX, 0x2D); } void vscatterdpd(const Address& addr, const Xmm& x) { opGather2(x, addr, T_N8 | T_66 | T_0F38 | T_EW1 | T_YMM | T_MUST_EVEX | T_M_K | T_VSIB, 0xA2, 1); } void vscatterdps(const Address& addr, const Xmm& x) { opGather2(x, addr, T_N4 | T_66 | T_0F38 | T_EW0 | T_YMM | T_MUST_EVEX | T_M_K | T_VSIB, 0xA2, 0); }