mirror of
https://github.com/vosen/ZLUDA.git
synced 2025-04-28 13:37:57 +03:00
84 lines
No EOL
3.4 KiB
LLVM
84 lines
No EOL
3.4 KiB
LLVM
@shared_ex = external addrspace(3) global [0 x i32]
|
|
@shared_mod = external addrspace(3) global [4 x i32]
|
|
|
|
define i64 @add() #0 {
|
|
%"46" = alloca i64, align 8, addrspace(5)
|
|
%"47" = alloca i64, align 8, addrspace(5)
|
|
%"48" = alloca i64, align 8, addrspace(5)
|
|
br label %1
|
|
|
|
1: ; preds = %0
|
|
br label %"41"
|
|
|
|
"41": ; preds = %1
|
|
%"49" = load i64, ptr addrspace(3) @shared_mod, align 4
|
|
store i64 %"49", ptr addrspace(5) %"47", align 4
|
|
%"50" = load i64, ptr addrspace(3) @shared_ex, align 4
|
|
store i64 %"50", ptr addrspace(5) %"48", align 4
|
|
%"52" = load i64, ptr addrspace(5) %"48", align 4
|
|
%"53" = load i64, ptr addrspace(5) %"47", align 4
|
|
%"75" = add i64 %"52", %"53"
|
|
store i64 %"75", ptr addrspace(5) %"46", align 4
|
|
%2 = load i64, ptr addrspace(5) %"46", align 4
|
|
ret i64 %2
|
|
}
|
|
|
|
define i64 @set_shared_temp1(i64 %"15") #0 {
|
|
%"54" = alloca i64, align 8, addrspace(5)
|
|
br label %1
|
|
|
|
1: ; preds = %0
|
|
br label %"42"
|
|
|
|
"42": ; preds = %1
|
|
store i64 %"15", ptr addrspace(3) @shared_ex, align 4
|
|
%"55" = call i64 @add()
|
|
store i64 %"55", ptr addrspace(5) %"54", align 4
|
|
br label %"43"
|
|
|
|
"43": ; preds = %"42"
|
|
%2 = load i64, ptr addrspace(5) %"54", align 4
|
|
ret i64 %2
|
|
}
|
|
|
|
define amdgpu_kernel void @shared_unify_extern(ptr addrspace(4) byref(i64) %"56", ptr addrspace(4) byref(i64) %"57") #1 {
|
|
%"58" = alloca i64, align 8, addrspace(5)
|
|
%"59" = alloca i64, align 8, addrspace(5)
|
|
%"60" = alloca i64, align 8, addrspace(5)
|
|
%"61" = alloca i64, align 8, addrspace(5)
|
|
br label %1
|
|
|
|
1: ; preds = %0
|
|
br label %"44"
|
|
|
|
"44": ; preds = %1
|
|
%"62" = load i64, ptr addrspace(4) %"56", align 4
|
|
store i64 %"62", ptr addrspace(5) %"58", align 4
|
|
%"63" = load i64, ptr addrspace(4) %"57", align 4
|
|
store i64 %"63", ptr addrspace(5) %"59", align 4
|
|
%"65" = load i64, ptr addrspace(5) %"58", align 4
|
|
%"78" = inttoptr i64 %"65" to ptr addrspace(1)
|
|
%"64" = load i64, ptr addrspace(1) %"78", align 4
|
|
store i64 %"64", ptr addrspace(5) %"60", align 4
|
|
%"66" = load i64, ptr addrspace(5) %"58", align 4
|
|
%"79" = inttoptr i64 %"66" to ptr addrspace(1)
|
|
%"40" = getelementptr inbounds i8, ptr addrspace(1) %"79", i64 8
|
|
%"67" = load i64, ptr addrspace(1) %"40", align 4
|
|
store i64 %"67", ptr addrspace(5) %"61", align 4
|
|
%"68" = load i64, ptr addrspace(5) %"61", align 4
|
|
store i64 %"68", ptr addrspace(3) @shared_mod, align 4
|
|
%"70" = load i64, ptr addrspace(5) %"60", align 4
|
|
%"81" = call i64 @set_shared_temp1(i64 %"70")
|
|
store i64 %"81", ptr addrspace(5) %"61", align 4
|
|
br label %"45"
|
|
|
|
"45": ; preds = %"44"
|
|
%"71" = load i64, ptr addrspace(5) %"59", align 4
|
|
%"72" = load i64, ptr addrspace(5) %"61", align 4
|
|
%"83" = inttoptr i64 %"71" to ptr
|
|
store i64 %"72", ptr %"83", align 4
|
|
ret void
|
|
}
|
|
|
|
attributes #0 = { "amdgpu-unsafe-fp-atomics"="true" "denormal-fp-math"="dynamic" "denormal-fp-math-f32"="dynamic" "no-trapping-math"="true" "uniform-work-group-size"="true" }
|
|
attributes #1 = { "amdgpu-unsafe-fp-atomics"="true" "denormal-fp-math"="preserve-sign" "denormal-fp-math-f32"="preserve-sign" "no-trapping-math"="true" "uniform-work-group-size"="true" } |