add vcmpph
diff --git a/gen/gen_avx512.cpp b/gen/gen_avx512.cpp
index 0a8eb13..c4f495e 100644
--- a/gen/gen_avx512.cpp
+++ b/gen/gen_avx512.cpp
@@ -107,6 +107,7 @@
 		{ 0xC2, "vcmpps", T_0F | T_MUST_EVEX | T_EW0 | T_SAE_Z | T_YMM | T_B32, true },
 		{ 0xC2, "vcmpsd", T_0F | T_MUST_EVEX | T_EW1 | T_SAE_Z | T_F2 | T_N8, true },
 		{ 0xC2, "vcmpss", T_0F | T_MUST_EVEX | T_EW0 | T_SAE_Z | T_F3 | T_N4, true },
+		{ 0xC2, "vcmpph", T_0F3A | T_MUST_EVEX | T_EW0 | T_SAE_Z | T_YMM | T_B32, true },
 
 		{ 0x74, "vpcmpeqb", T_66 | T_0F | T_MUST_EVEX | T_YMM, false },
 		{ 0x75, "vpcmpeqw", T_66 | T_0F | T_MUST_EVEX | T_YMM, false },
diff --git a/test/misc.cpp b/test/misc.cpp
index 77d7361..8e65712 100644
--- a/test/misc.cpp
+++ b/test/misc.cpp
@@ -866,7 +866,7 @@
 	CYBOZU_TEST_EXCEPTION(c.badVex(), std::exception);
 }
 
-CYBOZU_TEST_AUTO(vaddph)
+CYBOZU_TEST_AUTO(fp16)
 {
 	struct Code : Xbyak::CodeGenerator {
 		Code()
@@ -875,6 +875,10 @@
 			vaddph(ymm0, ymm1, ptr[rax+64]);
 			vaddph(xmm0, xmm1, ptr[rax+64]);
 			vaddsh(xmm0, xmm15, ptr[rax+64]);
+
+			vcmpph(k1, xm15, ptr[rax+64], 1);
+			vcmpph(k2, ym15, ptr[rax+64], 2);
+			vcmpph(k3, zm15, ptr[rax+64], 3);
 		}
 	} c;
 	const uint8_t tbl[] = {
@@ -882,6 +886,10 @@
 		0x62, 0xF5, 0x74, 0x28, 0x58, 0x40, 0x02,
 		0x62, 0xF5, 0x74, 0x08, 0x58, 0x40, 0x04,
 		0x62, 0xF5, 0x06, 0x08, 0x58, 0x40, 0x20,
+
+		0x62, 0xF3, 0x04, 0x08, 0xC2, 0x48, 0x04, 0x01,
+		0x62, 0xF3, 0x04, 0x28, 0xC2, 0x50, 0x02, 0x02,
+		0x62, 0xF3, 0x04, 0x48, 0xC2, 0x58, 0x01, 0x03,
 	};
 	const size_t n = sizeof(tbl) / sizeof(tbl[0]);
 	CYBOZU_TEST_EQUAL(c.getSize(), n);
diff --git a/xbyak/xbyak_mnemonic.h b/xbyak/xbyak_mnemonic.h
index f28dcbe..a3a6459 100644
--- a/xbyak/xbyak_mnemonic.h
+++ b/xbyak/xbyak_mnemonic.h
@@ -1870,6 +1870,7 @@
 void vcmpordsd(const Opmask& k, const Xmm& x, const Operand& op) { vcmpsd(k, x, op, 7); }
 void vcmpordss(const Opmask& k, const Xmm& x, const Operand& op) { vcmpss(k, x, op, 7); }
 void vcmppd(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_66 | T_0F | T_EW1 | T_YMM | T_SAE_Z | T_MUST_EVEX | T_B64, 0xC2, imm); }
+void vcmpph(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_0F3A | T_EW0 | T_YMM | T_SAE_Z | T_MUST_EVEX | T_B32, 0xC2, imm); }
 void vcmpps(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_0F | T_EW0 | T_YMM | T_SAE_Z | T_MUST_EVEX | T_B32, 0xC2, imm); }
 void vcmpsd(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_N8 | T_F2 | T_0F | T_EW1 | T_SAE_Z | T_MUST_EVEX, 0xC2, imm); }
 void vcmpss(const Opmask& k, const Xmm& x, const Operand& op, uint8_t imm) { opAVX_K_X_XM(k, x, op, T_N4 | T_F3 | T_0F | T_EW0 | T_SAE_Z | T_MUST_EVEX, 0xC2, imm); }