diff --git a/gen/gen_avx512.cpp b/gen/gen_avx512.cpp index 36a9697..856534d 100644 --- a/gen/gen_avx512.cpp +++ b/gen/gen_avx512.cpp @@ -341,6 +341,7 @@ void putX_X_XM_IMM() { 0x0B, "vrndscalesd", T_66 | T_0F3A | T_MUST_EVEX | T_EW1 | T_N8, true }, { 0x0A, "vrndscaless", T_66 | T_0F3A | T_MUST_EVEX | T_EW0 | T_N4, true }, + { 0x0A, "vrndscalesh", T_0F3A | T_MUST_EVEX | T_EW0 | T_N2 | T_SAE_X, true }, { 0x2C, "vscalefpd", T_66 | T_0F38 | T_YMM | T_MUST_EVEX | T_EW1 | T_B64 | T_ER_Z, false }, { 0x2C, "vscalefps", T_66 | T_0F38 | T_YMM | T_MUST_EVEX | T_EW0 | T_B32 | T_ER_Z, false }, diff --git a/test/misc.cpp b/test/misc.cpp index 5383e48..7a9786b 100644 --- a/test/misc.cpp +++ b/test/misc.cpp @@ -1025,6 +1025,8 @@ CYBOZU_TEST_AUTO(vaddph) vrndscaleph(zmm1, ptr_b [rax+0x40], 0x6); vrndscaleph(zmm1|k1|T_z|T_sae, zmm5, 0x7); + vrndscalesh(xmm1, xmm3, ptr [rax+0x40], 0x1); + vrndscalesh(xmm1|k1|T_z|T_sae, xmm5, xmm4, 0x2); @@ -1219,7 +1221,9 @@ CYBOZU_TEST_AUTO(vaddph) 0x62, 0xf3, 0x7c, 0x58, 0x08, 0x48, 0x20, 0x06, 0x62, 0xf3, 0x7c, 0x99, 0x08, 0xcd, 0x07, - + // vrndscalesh + 0x62, 0xf3, 0x64, 0x08, 0x0a, 0x48, 0x20, 0x01, + 0x62, 0xf3, 0x54, 0x99, 0x0a, 0xcc, 0x02, }; diff --git a/xbyak/xbyak_mnemonic.h b/xbyak/xbyak_mnemonic.h index 5272a87..d13ef26 100644 --- a/xbyak/xbyak_mnemonic.h +++ b/xbyak/xbyak_mnemonic.h @@ -2195,6 +2195,7 @@ void vrndscalepd(const Xmm& x, const Operand& op, uint8_t imm) { opAVX_X_XM_IMM( void vrndscaleph(const Xmm& x, const Operand& op, uint8_t imm) { opAVX_X_XM_IMM(x, op, T_0F3A | T_EW0 | T_YMM | T_SAE_Z | T_MUST_EVEX | T_B16, 0x08, imm); } void vrndscaleps(const Xmm& x, const Operand& op, uint8_t imm) { opAVX_X_XM_IMM(x, op, T_66 | T_0F3A | T_EW0 | T_YMM | T_MUST_EVEX | T_B32, 0x08, imm); } void vrndscalesd(const Xmm& x1, const Xmm& x2, const Operand& op, uint8_t imm) { opAVX_X_X_XM(x1, x2, op, T_N8 | T_66 | T_0F3A | T_EW1 | T_MUST_EVEX, 0x0B, imm); } +void vrndscalesh(const Xmm& x1, const Xmm& x2, const Operand& op, uint8_t imm) { opAVX_X_X_XM(x1, x2, op, T_N2 | T_0F3A | T_EW0 | T_SAE_X | T_MUST_EVEX, 0x0A, imm); } void vrndscaless(const Xmm& x1, const Xmm& x2, const Operand& op, uint8_t imm) { opAVX_X_X_XM(x1, x2, op, T_N4 | T_66 | T_0F3A | T_EW0 | T_MUST_EVEX, 0x0A, imm); } void vrsqrt14pd(const Xmm& x, const Operand& op) { opAVX_X_XM_IMM(x, op, T_66 | T_0F38 | T_EW1 | T_YMM | T_MUST_EVEX | T_B64, 0x4E); } void vrsqrt14ps(const Xmm& x, const Operand& op) { opAVX_X_XM_IMM(x, op, T_66 | T_0F38 | T_EW0 | T_YMM | T_MUST_EVEX | T_B32, 0x4E); }