diff options
Diffstat (limited to 'ptx/src/test/spirv_run/shr_u32.ll')
-rw-r--r-- | ptx/src/test/spirv_run/shr_u32.ll | 30 |
1 files changed, 16 insertions, 14 deletions
diff --git a/ptx/src/test/spirv_run/shr_u32.ll b/ptx/src/test/spirv_run/shr_u32.ll index 22c8761..52153d9 100644 --- a/ptx/src/test/spirv_run/shr_u32.ll +++ b/ptx/src/test/spirv_run/shr_u32.ll @@ -2,9 +2,7 @@ target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:3 target triple = "amdgcn-amd-amdhsa" define protected amdgpu_kernel void @shr_u32(ptr addrspace(4) byref(i64) %"36", ptr addrspace(4) byref(i64) %"37") #0 { -"45": %"11" = alloca i1, align 1, addrspace(5) - store i1 false, ptr addrspace(5) %"11", align 1 %"4" = alloca i64, align 8, addrspace(5) %"5" = alloca i64, align 8, addrspace(5) %"6" = alloca i32, align 4, addrspace(5) @@ -12,6 +10,10 @@ define protected amdgpu_kernel void @shr_u32(ptr addrspace(4) byref(i64) %"36", %"8" = alloca i32, align 4, addrspace(5) %"9" = alloca i32, align 4, addrspace(5) %"10" = alloca i32, align 4, addrspace(5) + br label %1 + +1: ; preds = %0 + store i1 false, ptr addrspace(5) %"11", align 1 %"12" = load i64, ptr addrspace(4) %"36", align 8 store i64 %"12", ptr addrspace(5) %"4", align 8 %"13" = load i64, ptr addrspace(4) %"37", align 8 @@ -22,25 +24,25 @@ define protected amdgpu_kernel void @shr_u32(ptr addrspace(4) byref(i64) %"36", store i32 %"14", ptr addrspace(5) %"6", align 4 %"17" = load i64, ptr addrspace(5) %"4", align 8 %"39" = inttoptr i64 %"17" to ptr - %"47" = getelementptr inbounds i8, ptr %"39", i64 4 - %"16" = load i32, ptr %"47", align 4 + %"46" = getelementptr inbounds i8, ptr %"39", i64 4 + %"16" = load i32, ptr %"46", align 4 store i32 %"16", ptr addrspace(5) %"7", align 4 %"19" = load i64, ptr addrspace(5) %"4", align 8 %"40" = inttoptr i64 %"19" to ptr - %"49" = getelementptr inbounds i8, ptr %"40", i64 8 - %"18" = load i32, ptr %"49", align 4 + %"48" = getelementptr inbounds i8, ptr %"40", i64 8 + %"18" = load i32, ptr %"48", align 4 store i32 %"18", ptr addrspace(5) %"8", align 4 %"21" = load i32, ptr addrspace(5) %"6", align 4 %"22" = load i32, ptr addrspace(5) %"7", align 4 - %0 = icmp ugt i32 %"22", 31 - %1 = lshr i32 %"21", %"22" - %"20" = select i1 %0, i32 0, i32 %1 + %2 = icmp ugt i32 %"22", 31 + %3 = lshr i32 %"21", %"22" + %"20" = select i1 %2, i32 0, i32 %3 store i32 %"20", ptr addrspace(5) %"9", align 4 %"24" = load i32, ptr addrspace(5) %"6", align 4 %"25" = load i32, ptr addrspace(5) %"8", align 4 - %2 = icmp ugt i32 %"25", 31 - %3 = lshr i32 %"24", %"25" - %"23" = select i1 %2, i32 0, i32 %3 + %4 = icmp ugt i32 %"25", 31 + %5 = lshr i32 %"24", %"25" + %"23" = select i1 %4, i32 0, i32 %5 store i32 %"23", ptr addrspace(5) %"10", align 4 %"26" = load i64, ptr addrspace(5) %"5", align 8 %"27" = load i32, ptr addrspace(5) %"9", align 4 @@ -49,8 +51,8 @@ define protected amdgpu_kernel void @shr_u32(ptr addrspace(4) byref(i64) %"36", %"28" = load i64, ptr addrspace(5) %"5", align 8 %"29" = load i32, ptr addrspace(5) %"10", align 4 %"44" = inttoptr i64 %"28" to ptr - %"51" = getelementptr inbounds i8, ptr %"44", i64 4 - store i32 %"29", ptr %"51", align 4 + %"50" = getelementptr inbounds i8, ptr %"44", i64 4 + store i32 %"29", ptr %"50", align 4 ret void } |