diff options
author | MITSUNARI Shigeo <[email protected]> | 2024-10-11 11:50:55 +0900 |
---|---|---|
committer | MITSUNARI Shigeo <[email protected]> | 2024-10-13 13:51:06 +0900 |
commit | 3ca7e64c63daac8c3dd1c3cbafdc26ac011fa6ab (patch) | |
tree | c9f0509a05372e641bc698466064e7e1be1ce20b /test | |
parent | 864fd0c49ce07fc534b16250758987c445bb9c70 (diff) | |
download | xbyak-3ca7e64c63daac8c3dd1c3cbafdc26ac011fa6ab.tar.gz xbyak-3ca7e64c63daac8c3dd1c3cbafdc26ac011fa6ab.zip |
add type of w(x, x, op) in avx10 bf16
Diffstat (limited to 'test')
-rw-r--r-- | test/avx10/bf16.txt | 30 |
1 files changed, 30 insertions, 0 deletions
```diff
diff --git a/test/avx10/bf16.txt b/test/avx10/bf16.txt
index 1c77f93..d8f4c5a 100644
--- a/test/avx10/bf16.txt
+++ b/test/avx10/bf16.txt
@@ -2,3 +2,33 @@ vaddnepbf16(xm1, xm2, xm3);
 vaddnepbf16(ym1|k1, ym2, ptr[rax+128]);
 vaddnepbf16(ym1|k1, ym2, ptr_b[rax+128]);
 vaddnepbf16(zm1|k2|T_z, zm2, ptr_b[rax+128]);
+
+vdivnepbf16(xm1, xm2, xm3);
+vdivnepbf16(ym1|k1, ym2, ptr[rax+128]);
+vdivnepbf16(ym1|k1, ym2, ptr_b[rax+128]);
+vdivnepbf16(zm1|k2|T_z, zm2, ptr_b[rax+128]);
+
+vmaxpbf16(xm1, xm2, xm3);
+vmaxpbf16(ym1|k1, ym2, ptr[rax+128]);
+vmaxpbf16(ym1|k1, ym2, ptr_b[rax+128]);
+vmaxpbf16(zm1|k2|T_z, zm2, ptr_b[rax+128]);
+
+vminpbf16(xm1, xm2, xm3);
+vminpbf16(ym1|k1, ym2, ptr[rax+128]);
+vminpbf16(ym1|k1, ym2, ptr_b[rax+128]);
+vminpbf16(zm1|k2|T_z, zm2, ptr_b[rax+128]);
+
+vmulnepbf16(xm1, xm2, xm3);
+vmulnepbf16(ym1|k1, ym2, ptr[rax+128]);
+vmulnepbf16(ym1|k1, ym2, ptr_b[rax+128]);
+vmulnepbf16(zm1|k2|T_z, zm2, ptr_b[rax+128]);
+
+vscalefpbf16(xm1, xm2, xm3);
+vscalefpbf16(ym1|k1, ym2, ptr[rax+128]);
+vscalefpbf16(ym1|k1, ym2, ptr_b[rax+128]);
+vscalefpbf16(zm1|k2|T_z, zm2, ptr_b[rax+128]);
+
+vsubnepbf16(xm1, xm2, xm3);
+vsubnepbf16(ym1|k1, ym2, ptr[rax+128]);
+vsubnepbf16(ym1|k1, ym2, ptr_b[rax+128]);
+vsubnepbf16(zm1|k2|T_z, zm2, ptr_b[rax+128]);
```