add detection of movdiri
diff --git a/sample/test_util.cpp b/sample/test_util.cpp
index 27b1cf0..0b5ce57 100644
--- a/sample/test_util.cpp
+++ b/sample/test_util.cpp
@@ -86,6 +86,7 @@
 		{ Cpu::tWAITPKG, "waitpkg" },
 		{ Cpu::tCLFLUSHOPT, "clflushopt" },
 		{ Cpu::tCLDEMOTE, "cldemote" },
+		{ Cpu::tMOVDIRI, "movidiri" },
 	};
 	for (size_t i = 0; i < NUM_OF_ARRAY(tbl); i++) {
 		if (cpu.has(tbl[i].type)) printf(" %s", tbl[i].str);
diff --git a/xbyak/xbyak_util.h b/xbyak/xbyak_util.h
index 68d40f0..546e1a0 100644
--- a/xbyak/xbyak_util.h
+++ b/xbyak/xbyak_util.h
@@ -430,6 +430,7 @@
 	static const Type tAVX_VNNI;
 	static const Type tCLFLUSHOPT;
 	static const Type tCLDEMOTE;
+	static const Type tMOVDIRI;
 
 	CpuT()
 		: type_(NONE)
@@ -553,6 +554,7 @@
 			if (ECX & (1U << 0)) type_ |= tPREFETCHWT1;
 			if (ECX & (1U << 5)) type_ |= tWAITPKG;
 			if (ECX & (1U << 25)) type_ |= tCLDEMOTE;
+			if (ECX & (1U << 27)) type_ |= tMOVDIRI;
 			if (EDX & (1U << 24)) type_ |= tAMX_TILE;
 			if (EDX & (1U << 25)) type_ |= tAMX_INT8;
 			if (EDX & (1U << 22)) type_ |= tAMX_BF16;
@@ -653,6 +655,7 @@
 template<int dummy> const Type CpuT<dummy>::tAVX_VNNI = uint64_t(1) << 62;
 template<int dummy> const Type CpuT<dummy>::tCLFLUSHOPT = Type(1) << 63;
 template<int dummy> const Type CpuT<dummy>::tCLDEMOTE = Type(1) << 64;
+template<int dummy> const Type CpuT<dummy>::tMOVDIRI = Type(1) << 65;
 
 } // local