summaryrefslogtreecommitdiff
path: root/r600/lib/synchronization/barrier_impl.ll
blob: 3d8ee66bab6e219d16e7b9725642a12b0de8f5c0 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
declare i32 @__clc_clk_local_mem_fence() nounwind alwaysinline
declare i32 @__clc_clk_global_mem_fence() nounwind alwaysinline
declare void @llvm.AMDGPU.barrier.local() nounwind noduplicate
declare void @llvm.AMDGPU.barrier.global() nounwind noduplicate

define void @barrier(i32 %flags) nounwind noduplicate alwaysinline {
barrier_local_test:
  %CLK_LOCAL_MEM_FENCE = call i32 @__clc_clk_local_mem_fence()
  %0 = and i32 %flags, %CLK_LOCAL_MEM_FENCE
  %1 = icmp ne i32 %0, 0
  br i1 %1, label %barrier_local, label %barrier_global_test

barrier_local:
  call void @llvm.AMDGPU.barrier.local() noduplicate
  br label %barrier_global_test

barrier_global_test:
  %CLK_GLOBAL_MEM_FENCE = call i32 @__clc_clk_global_mem_fence()
  %2 = and i32 %flags, %CLK_GLOBAL_MEM_FENCE
  %3 = icmp ne i32 %2, 0
  br i1 %3, label %barrier_global, label %done

barrier_global:
  call void @llvm.AMDGPU.barrier.global() noduplicate
  br label %done

done:
  ret void
}