From 1b9ba2b2333746c5e2b05a2bf24fa6ec3828dcdf Mon Sep 17 00:00:00 2001
From: Andrzej Janik
Date: Sat, 27 Feb 2021 20:55:19 +0100
Subject: Nobody expects the Red Team

Too many changes to list, but broadly:
* Remove Intel GPU support from the compiler
* Add AMD GPU support to the compiler
* Remove Intel GPU host code
* Add AMD GPU host code
* More device instructions. From 40 to 68
* More host functions. From 48 to 184
* Add proof of concept implementation of OptiX framework
* Add minimal support of cuDNN, cuBLAS, cuSPARSE, cuFFT, NCCL, NVML
* Improve ZLUDA launcher for Windows
---
 ptx/src/test/spirv_run/bfind.ptx | 27 +++++++++++++++++++++++++++
 1 file changed, 27 insertions(+)
 create mode 100644 ptx/src/test/spirv_run/bfind.ptx

(limited to 'ptx/src/test/spirv_run/bfind.ptx')

diff --git a/ptx/src/test/spirv_run/bfind.ptx b/ptx/src/test/spirv_run/bfind.ptx
new file mode 100644
index 0000000..a49fce3
--- /dev/null
+++ b/ptx/src/test/spirv_run/bfind.ptx
@@ -0,0 +1,27 @@
+.version 6.5                        // PTX ISA version this module is written against
+.target sm_30                       // target architecture named by the module
+.address_size 64                    // 64-bit addresses; matches the .u64 pointer params below
+
+.visible .entry bfind(              // kernel: output[i] = bfind.u32(input[i]) for i = 0, 1, 2
+    .param .u64 input,              // address of three consecutive 32-bit source words
+    .param .u64 output              // address where the three 32-bit results are written
+)
+{
+    .reg .u64 in_addr;              // holds the `input` pointer once loaded from param space
+    .reg .u64 out_addr;             // holds the `output` pointer once loaded from param space
+    .reg .u32 temp<6>;              // declares temp0..temp5: temp0-2 = loaded words, temp3-5 = results
+
+    ld.param.u64 in_addr, [input];      // fetch both kernel arguments into registers
+    ld.param.u64 out_addr, [output];
+
+    ld.u32 temp0, [in_addr];            // read the three source words at byte offsets 0, 4 and 8
+    ld.u32 temp1, [in_addr+4];          // (no state-space qualifier on ld/st: generic addressing per the PTX ISA)
+    ld.u32 temp2, [in_addr+8];
+    bfind.u32 temp3, temp0;             // per the PTX ISA: bit position of the most significant set bit,
+    bfind.u32 temp4, temp1;             // or 0xffffffff when the unsigned input is 0
+    bfind.u32 temp5, temp2;
+    st.u32 [out_addr], temp3;           // write results in the same order, at byte offsets 0, 4 and 8
+    st.u32 [out_addr+4], temp4;
+    st.u32 [out_addr+8], temp5;
+    ret;                                // end of kernel
+}
--
cgit v1.2.3