ZLUDA/ptx/src/test/ll/shared_unify_extern.ll
Joëlle van Essen 867e4728d5
LLVM unit tests (#324)
* LLVM unit tests: add assembly files

* LLVM unit tests: first attempt

* LLVM unit tests: fix - parse bitcode in context

* LLVM unit tests: use pretty_assertions for line-by-line diff

* LLVM unit tests: Write IR to file for failed test

* LLVM unit tests: just use the stack

* LLVM unit tests: use MaybeUninit

* LLVM unit tests: add mul24.ll

* LLVM unit tests: Adjustments after review

* LLVM unit tests: Include emit_llvm::Context in emit_llvm::Module

* LLVM unit tests: Fix typo

* LLVM unit tests: Context need not be pub
2025-02-19 21:21:20 +01:00

80 lines
3.1 KiB
LLVM

@shared_ex = external addrspace(3) global [0 x i32]
@shared_mod = external addrspace(3) global [4 x i32]
declare i32 @__zluda_ptx_impl_sreg_tid(i8) #0
declare i32 @__zluda_ptx_impl_sreg_ntid(i8) #0
declare i32 @__zluda_ptx_impl_sreg_ctaid(i8) #0
declare i32 @__zluda_ptx_impl_sreg_nctaid(i8) #0
declare i32 @__zluda_ptx_impl_sreg_clock() #0
declare i32 @__zluda_ptx_impl_sreg_lanemask_lt() #0
define i64 @__zluda_ptx_impl_add() #0 {
%"46" = alloca i64, align 8, addrspace(5)
%"47" = alloca i64, align 8, addrspace(5)
%"48" = alloca i64, align 8, addrspace(5)
br label %1
1: ; preds = %0
%"49" = load i64, ptr addrspace(3) @shared_mod, align 4
store i64 %"49", ptr addrspace(5) %"47", align 4
%"50" = load i64, ptr addrspace(3) @shared_ex, align 4
store i64 %"50", ptr addrspace(5) %"48", align 4
%"52" = load i64, ptr addrspace(5) %"48", align 4
%"53" = load i64, ptr addrspace(5) %"47", align 4
%"75" = add i64 %"52", %"53"
store i64 %"75", ptr addrspace(5) %"46", align 4
%2 = load i64, ptr addrspace(5) %"46", align 4
ret i64 %2
}
define i64 @__zluda_ptx_impl_set_shared_temp1(i64 %"15") #0 {
%"54" = alloca i64, align 8, addrspace(5)
br label %1
1: ; preds = %0
store i64 %"15", ptr addrspace(3) @shared_ex, align 4
%"55" = call i64 @__zluda_ptx_impl_add()
store i64 %"55", ptr addrspace(5) %"54", align 4
%2 = load i64, ptr addrspace(5) %"54", align 4
ret i64 %2
}
define amdgpu_kernel void @shared_unify_extern(ptr addrspace(4) byref(i64) %"56", ptr addrspace(4) byref(i64) %"57") #0 {
%"58" = alloca i64, align 8, addrspace(5)
%"59" = alloca i64, align 8, addrspace(5)
%"60" = alloca i64, align 8, addrspace(5)
%"61" = alloca i64, align 8, addrspace(5)
br label %1
1: ; preds = %0
%"62" = load i64, ptr addrspace(4) %"56", align 4
store i64 %"62", ptr addrspace(5) %"58", align 4
%"63" = load i64, ptr addrspace(4) %"57", align 4
store i64 %"63", ptr addrspace(5) %"59", align 4
%"65" = load i64, ptr addrspace(5) %"58", align 4
%"78" = inttoptr i64 %"65" to ptr addrspace(1)
%"64" = load i64, ptr addrspace(1) %"78", align 4
store i64 %"64", ptr addrspace(5) %"60", align 4
%"66" = load i64, ptr addrspace(5) %"58", align 4
%"79" = inttoptr i64 %"66" to ptr addrspace(1)
%"39" = getelementptr inbounds i8, ptr addrspace(1) %"79", i64 8
%"67" = load i64, ptr addrspace(1) %"39", align 4
store i64 %"67", ptr addrspace(5) %"61", align 4
%"68" = load i64, ptr addrspace(5) %"61", align 4
store i64 %"68", ptr addrspace(3) @shared_mod, align 4
%"70" = load i64, ptr addrspace(5) %"60", align 4
%"81" = call i64 @__zluda_ptx_impl_set_shared_temp1(i64 %"70")
store i64 %"81", ptr addrspace(5) %"61", align 4
%"71" = load i64, ptr addrspace(5) %"59", align 4
%"72" = load i64, ptr addrspace(5) %"61", align 4
%"83" = inttoptr i64 %"71" to ptr
store i64 %"72", ptr %"83", align 4
ret void
}
attributes #0 = { "amdgpu-unsafe-fp-atomics"="true" "no-trapping-math"="true" "uniform-work-group-size"="true" }