about | summary | refs | log | tree | commit | diff | homepage
diff options
context:
space:
mode:
author: MITSUNARI Shigeo <[email protected]> 2021-09-09 11:10:37 +0900
committer: MITSUNARI Shigeo <[email protected]> 2021-09-09 11:10:37 +0900
commit: 2f14eae85c63281c9a1ce2b6e786924faa4af4ae (patch)
tree: e679ac872f08f8207d31156141a1346df584973b
parent: f96870a44e4c0ee0dd0e42aa1c0b385ca50ed3c6 (diff)
download: xbyak-2f14eae85c63281c9a1ce2b6e786924faa4af4ae.tar.gz
download: xbyak-2f14eae85c63281c9a1ce2b6e786924faa4af4ae.zip
add vrndscaleph
-rw-r--r--  gen/gen_avx512.cpp      1
-rw-r--r--  test/misc.cpp          21
-rw-r--r--  xbyak/xbyak_mnemonic.h  1
3 files changed, 23 insertions, 0 deletions
diff --git a/gen/gen_avx512.cpp b/gen/gen_avx512.cpp
index dd7e855..36a9697 100644
--- a/gen/gen_avx512.cpp
+++ b/gen/gen_avx512.cpp
@@ -671,6 +671,7 @@ void putX_XM_IMM()
{ 0x09, "vrndscalepd", T_66 | T_0F3A | T_YMM | T_MUST_EVEX | T_EW1 | T_B64, true },
{ 0x08, "vrndscaleps", T_66 | T_0F3A | T_YMM | T_MUST_EVEX | T_EW0 | T_B32, true },
+ { 0x08, "vrndscaleph", T_0F3A | T_YMM | T_MUST_EVEX | T_EW0 | T_B16 | T_SAE_Z, true },
{ 0xC4, "vpconflictd", T_66 | T_0F38 | T_YMM | T_MUST_EVEX | T_EW0 | T_B32, false },
{ 0xC4, "vpconflictq", T_66 | T_0F38 | T_YMM | T_MUST_EVEX | T_EW1 | T_B64, false },
diff --git a/test/misc.cpp b/test/misc.cpp
index e67225a..5383e48 100644
--- a/test/misc.cpp
+++ b/test/misc.cpp
@@ -1017,6 +1017,14 @@ CYBOZU_TEST_AUTO(vaddph)
vreducesh(xmm1, xmm3, ptr [rax+0x40], 0x1);
vreducesh(xmm1|k1|T_z|T_sae, xmm5, xmm4, 0x2);
+ vrndscaleph(xmm1, ptr [rax+0x40], 0x1);
+ vrndscaleph(xmm1, ptr_b [rax+0x40], 0x2);
+ vrndscaleph(ymm1, ptr [rax+0x40], 0x3);
+ vrndscaleph(ymm1, ptr_b [rax+0x40], 0x4);
+ vrndscaleph(zmm1, ptr [rax+0x40], 0x5);
+ vrndscaleph(zmm1, ptr_b [rax+0x40], 0x6);
+ vrndscaleph(zmm1|k1|T_z|T_sae, zmm5, 0x7);
+
@@ -1201,6 +1209,19 @@ CYBOZU_TEST_AUTO(vaddph)
// vreducesh
0x62, 0xf3, 0x64, 0x08, 0x57, 0x48, 0x20, 0x01,
0x62, 0xf3, 0x54, 0x99, 0x57, 0xcc, 0x02,
+
+ // vrndscaleph
+ 0x62, 0xf3, 0x7c, 0x08, 0x08, 0x48, 0x04, 0x01,
+ 0x62, 0xf3, 0x7c, 0x18, 0x08, 0x48, 0x20, 0x02,
+ 0x62, 0xf3, 0x7c, 0x28, 0x08, 0x48, 0x02, 0x03,
+ 0x62, 0xf3, 0x7c, 0x38, 0x08, 0x48, 0x20, 0x04,
+ 0x62, 0xf3, 0x7c, 0x48, 0x08, 0x48, 0x01, 0x05,
+ 0x62, 0xf3, 0x7c, 0x58, 0x08, 0x48, 0x20, 0x06,
+ 0x62, 0xf3, 0x7c, 0x99, 0x08, 0xcd, 0x07,
+
+
+
+
};
const size_t n = sizeof(tbl) / sizeof(tbl[0]);
CYBOZU_TEST_EQUAL(c.getSize(), n);
diff --git a/xbyak/xbyak_mnemonic.h b/xbyak/xbyak_mnemonic.h
index 0918078..5272a87 100644
--- a/xbyak/xbyak_mnemonic.h
+++ b/xbyak/xbyak_mnemonic.h
@@ -2192,6 +2192,7 @@ void vreducesd(const Xmm& x1, const Xmm& x2, const Operand& op, uint8_t imm) { o
void vreducesh(const Xmm& x1, const Xmm& x2, const Operand& op, uint8_t imm) { opAVX_X_X_XM(x1, x2, op, T_N2 | T_0F3A | T_EW0 | T_SAE_X | T_MUST_EVEX, 0x57, imm); }
void vreducess(const Xmm& x1, const Xmm& x2, const Operand& op, uint8_t imm) { opAVX_X_X_XM(x1, x2, op, T_N4 | T_66 | T_0F3A | T_EW0 | T_SAE_X | T_MUST_EVEX, 0x57, imm); }
void vrndscalepd(const Xmm& x, const Operand& op, uint8_t imm) { opAVX_X_XM_IMM(x, op, T_66 | T_0F3A | T_EW1 | T_YMM | T_MUST_EVEX | T_B64, 0x09, imm); }
+void vrndscaleph(const Xmm& x, const Operand& op, uint8_t imm) { opAVX_X_XM_IMM(x, op, T_0F3A | T_EW0 | T_YMM | T_SAE_Z | T_MUST_EVEX | T_B16, 0x08, imm); }
void vrndscaleps(const Xmm& x, const Operand& op, uint8_t imm) { opAVX_X_XM_IMM(x, op, T_66 | T_0F3A | T_EW0 | T_YMM | T_MUST_EVEX | T_B32, 0x08, imm); }
void vrndscalesd(const Xmm& x1, const Xmm& x2, const Operand& op, uint8_t imm) { opAVX_X_X_XM(x1, x2, op, T_N8 | T_66 | T_0F3A | T_EW1 | T_MUST_EVEX, 0x0B, imm); }
void vrndscaless(const Xmm& x1, const Xmm& x2, const Operand& op, uint8_t imm) { opAVX_X_X_XM(x1, x2, op, T_N4 | T_66 | T_0F3A | T_EW0 | T_MUST_EVEX, 0x0A, imm); }