diff --git a/gen/gen_avx512.cpp b/gen/gen_avx512.cpp index b45e753..2c1f663 100644 --- a/gen/gen_avx512.cpp +++ b/gen/gen_avx512.cpp @@ -107,7 +107,7 @@ void putVcmp() { 0xC2, "vcmpps", T_0F | T_MUST_EVEX | T_EW0 | T_SAE_Z | T_YMM | T_B32, true }, { 0xC2, "vcmpsd", T_0F | T_MUST_EVEX | T_EW1 | T_SAE_Z | T_F2 | T_N8, true }, { 0xC2, "vcmpss", T_0F | T_MUST_EVEX | T_EW0 | T_SAE_Z | T_F3 | T_N4, true }, - { 0xC2, "vcmpph", T_0F3A | T_MUST_EVEX | T_EW0 | T_SAE_Z | T_YMM | T_B32, true }, + { 0xC2, "vcmpph", T_0F3A | T_MUST_EVEX | T_EW0 | T_SAE_Z | T_YMM | T_B16, true }, { 0xC2, "vcmpsh", T_0F3A | T_MUST_EVEX | T_EW0 | T_SAE_X, true }, { 0x74, "vpcmpeqb", T_66 | T_0F | T_MUST_EVEX | T_YMM, false }, diff --git a/test/misc.cpp b/test/misc.cpp index 1c6e8ca..38a4679 100644 --- a/test/misc.cpp +++ b/test/misc.cpp @@ -881,6 +881,13 @@ CYBOZU_TEST_AUTO(vaddph) vaddsh(xmm0, xmm15, ptr[rax+64]); vaddsh(xmm0|k5|T_z|T_rd_sae, xmm15, xmm3); + + vcmpph(k1, xm15, ptr[rax+64], 1); + vcmpph(k2, ym15, ptr[rax+64], 2); + vcmpph(k3, zm15, ptr[rax+64], 3); + vcmpph(k1, xm15, ptr_b[rax+64], 1); + vcmpph(k2, ym15, ptr_b[rax+64], 2); + vcmpph(k3, zm15, ptr_b[rax+64], 3); } } c; const uint8_t tbl[] = { @@ -894,6 +901,13 @@ CYBOZU_TEST_AUTO(vaddph) 0x62, 0xF5, 0x06, 0x08, 0x58, 0x40, 0x20, 0x62, 0xF5, 0x06, 0xBD, 0x58, 0xC3, + + 0x62, 0xf3, 0x04, 0x08, 0xc2, 0x48, 0x04, 0x01, + 0x62, 0xf3, 0x04, 0x28, 0xc2, 0x50, 0x02, 0x02, + 0x62, 0xf3, 0x04, 0x48, 0xc2, 0x58, 0x01, 0x03, + 0x62, 0xf3, 0x04, 0x18, 0xc2, 0x48, 0x20, 0x01, + 0x62, 0xf3, 0x04, 0x38, 0xc2, 0x50, 0x20, 0x02, + 0x62, 0xf3, 0x04, 0x58, 0xc2, 0x58, 0x20, 0x03, }; const size_t n = sizeof(tbl) / sizeof(tbl[0]); CYBOZU_TEST_EQUAL(c.getSize(), n); diff --git a/xbyak/xbyak_mnemonic.h b/xbyak/xbyak_mnemonic.h index cc1ff53..ae5bce0 100644 --- a/xbyak/xbyak_mnemonic.h +++ b/xbyak/xbyak_mnemonic.h @@ -1870,7 +1870,7 @@ void vcmpordps(const Opmask& k, const Xmm& x, const Operand& op) { vcmpps(k, x, void vcmpordsd(const Opmask& k, const Xmm& x, const Operand& op) { vcmpsd(k, x, op, 7); } void vcmpordss(const Opmask& k, const Xmm& x, const Operand& op) { vcmpss(k, x, op, 7); } void vcmppd(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_66 | T_0F | T_EW1 | T_YMM | T_SAE_Z | T_MUST_EVEX | T_B64, 0xC2, imm); } -void vcmpph(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_0F3A | T_EW0 | T_YMM | T_SAE_Z | T_MUST_EVEX | T_B32, 0xC2, imm); } +void vcmpph(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_0F3A | T_EW0 | T_YMM | T_SAE_Z | T_MUST_EVEX | T_B16, 0xC2, imm); } void vcmpps(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_0F | T_EW0 | T_YMM | T_SAE_Z | T_MUST_EVEX | T_B32, 0xC2, imm); } void vcmpsd(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_N8 | T_F2 | T_0F | T_EW1 | T_SAE_Z | T_MUST_EVEX, 0xC2, imm); } void vcmpsh(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_0F3A | T_EW0 | T_SAE_X | T_MUST_EVEX, 0xC2, imm); }