|
| 1 | +; Adapted from Khronos Translator test suite: test/CodeGen/SPIRV/extensions/SPV_INTEL_split_barrier/ |
| 2 | + |
| 3 | +;; kernel void test(global uint* dst) |
| 4 | +;; { |
| 5 | +;; intel_work_group_barrier_arrive(CLK_LOCAL_MEM_FENCE); |
| 6 | +;; intel_work_group_barrier_wait(CLK_LOCAL_MEM_FENCE); |
| 7 | +;; intel_work_group_barrier_arrive(CLK_GLOBAL_MEM_FENCE); |
| 8 | +;; intel_work_group_barrier_wait(CLK_GLOBAL_MEM_FENCE); |
| 9 | +;; |
| 10 | +;; intel_work_group_barrier_arrive(CLK_LOCAL_MEM_FENCE | CLK_GLOBAL_MEM_FENCE); |
| 11 | +;; intel_work_group_barrier_wait(CLK_LOCAL_MEM_FENCE | CLK_GLOBAL_MEM_FENCE); |
| 12 | +;;} |
| 13 | + |
| 14 | +; RUN: not llc -O0 -mtriple=spirv64-unknown-unknown %s -o %t.spvt 2>&1 | FileCheck %s --check-prefix=CHECK-ERROR |
| 15 | + |
| 16 | +; CHECK-ERROR: LLVM ERROR: intel_work_group_barrier_arrive: the builtin requires the following SPIR-V extension: SPV_INTEL_split_barrier |
| 17 | + |
| 18 | +; RUN: llc -verify-machineinstrs -O0 -mtriple=spirv64-unknown-unknown --spirv-ext=+SPV_INTEL_split_barrier %s -o - | FileCheck %s |
| 19 | +; RUN: %if spirv-tools %{ llc -O0 -mtriple=spirv64-unknown-unknown --spirv-ext=+SPV_INTEL_split_barrier %s -o - -filetype=obj | spirv-val %} |
| 20 | + |
| 21 | +; CHECK: Capability SplitBarrierINTEL |
| 22 | +; CHECK: Extension "SPV_INTEL_split_barrier" |
| 23 | +; CHECK: %[[#UINT:]] = OpTypeInt 32 0 |
| 24 | +; |
| 25 | +; Scopes: |
| 26 | +; CHECK-DAG: %[[#SCOPE_WORK_GROUP:]] = OpConstant %[[#UINT]] 2{{$}} |
| 27 | +; |
| 28 | +; Memory Semantics: |
| 29 | +; 0x2 Acquire + 0x100 WorkgroupMemory |
| 30 | +; CHECK-DAG: %[[#ACQUIRE_LOCAL:]] = OpConstant %[[#UINT]] 258 |
| 31 | +; 0x4 Release + 0x100 WorkgroupMemory |
| 32 | +; CHECK-DAG: %[[#RELEASE_LOCAL:]] = OpConstant %[[#UINT]] 260 |
| 33 | +; 0x2 Acquire + 0x200 CrossWorkgroupMemory |
| 34 | +; CHECK-DAG: %[[#ACQUIRE_GLOBAL:]] = OpConstant %[[#UINT]] 514 |
| 35 | +; 0x4 Release + 0x200 CrossWorkgroupMemory |
| 36 | +; CHECK-DAG: %[[#RELEASE_GLOBAL:]] = OpConstant %[[#UINT]] 516 |
| 37 | +; 0x2 Acquire + 0x100 WorkgroupMemory + 0x200 CrossWorkgroupMemory |
| 38 | +; CHECK-DAG: %[[#ACQUIRE_LOCAL_GLOBAL:]] = OpConstant %[[#UINT]] 770 |
| 39 | +; 0x4 Release + 0x100 WorkgroupMemory + 0x200 CrossWorkgroupMemory |
| 40 | +; CHECK-DAG: %[[#RELEASE_LOCAL_GLOBAL:]] = OpConstant %[[#UINT]] 772 |
| 41 | +; |
| 42 | +; CHECK: OpControlBarrierArriveINTEL %[[#SCOPE_WORK_GROUP]] %[[#SCOPE_WORK_GROUP]] %[[#RELEASE_LOCAL]] |
| 43 | +; CHECK: OpControlBarrierWaitINTEL %[[#SCOPE_WORK_GROUP]] %[[#SCOPE_WORK_GROUP]] %[[#ACQUIRE_LOCAL]] |
| 44 | +; CHECK: OpControlBarrierArriveINTEL %[[#SCOPE_WORK_GROUP]] %[[#SCOPE_WORK_GROUP]] %[[#RELEASE_GLOBAL]] |
| 45 | +; CHECK: OpControlBarrierWaitINTEL %[[#SCOPE_WORK_GROUP]] %[[#SCOPE_WORK_GROUP]] %[[#ACQUIRE_GLOBAL]] |
| 46 | +; |
| 47 | +; CHECK: OpControlBarrierArriveINTEL %[[#SCOPE_WORK_GROUP]] %[[#SCOPE_WORK_GROUP]] %[[#RELEASE_LOCAL_GLOBAL]] |
| 48 | +; CHECK: OpControlBarrierWaitINTEL %[[#SCOPE_WORK_GROUP]] %[[#SCOPE_WORK_GROUP]] %[[#ACQUIRE_LOCAL_GLOBAL]] |
| 49 | + |
| 50 | +; Function Attrs: convergent norecurse nounwind |
| 51 | +define dso_local spir_kernel void @test(ptr addrspace(1) nocapture noundef readnone align 4 %0) local_unnamed_addr #0 !kernel_arg_addr_space !4 !kernel_arg_access_qual !5 !kernel_arg_type !6 !kernel_arg_base_type !6 !kernel_arg_type_qual !7 { |
| 52 | + tail call spir_func void @_Z31intel_work_group_barrier_arrivej(i32 noundef 1) #2 |
| 53 | + tail call spir_func void @_Z29intel_work_group_barrier_waitj(i32 noundef 1) #2 |
| 54 | + tail call spir_func void @_Z31intel_work_group_barrier_arrivej(i32 noundef 2) #2 |
| 55 | + tail call spir_func void @_Z29intel_work_group_barrier_waitj(i32 noundef 2) #2 |
| 56 | + tail call spir_func void @_Z31intel_work_group_barrier_arrivej(i32 noundef 3) #2 |
| 57 | + tail call spir_func void @_Z29intel_work_group_barrier_waitj(i32 noundef 3) #2 |
| 58 | + ret void |
| 59 | +} |
| 60 | + |
| 61 | +; Function Attrs: convergent |
| 62 | +declare dso_local spir_func void @_Z31intel_work_group_barrier_arrivej(i32 noundef) local_unnamed_addr #1 |
| 63 | + |
| 64 | +; Function Attrs: convergent |
| 65 | +declare dso_local spir_func void @_Z29intel_work_group_barrier_waitj(i32 noundef) local_unnamed_addr #1 |
| 66 | + |
| 67 | +attributes #0 = { convergent norecurse nounwind "frame-pointer"="all" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "uniform-work-group-size"="true" } |
| 68 | +attributes #1 = { convergent "frame-pointer"="all" "no-trapping-math"="true" "stack-protector-buffer-size"="8" } |
| 69 | +attributes #2 = { convergent nounwind } |
| 70 | + |
| 71 | +!llvm.module.flags = !{!0, !1} |
| 72 | +!opencl.ocl.version = !{!2} |
| 73 | +!opencl.spir.version = !{!2} |
| 74 | +!llvm.ident = !{!3} |
| 75 | + |
| 76 | +!0 = !{i32 1, !"wchar_size", i32 4} |
| 77 | +!1 = !{i32 7, !"frame-pointer", i32 2} |
| 78 | +!2 = !{i32 1, i32 2} |
| 79 | +!3 = !{!"clang version 15.0.0 (https://github.com/llvm/llvm-project 861386dbd6ff0d91636b7c674c2abb2eccd9d3f2)"} |
| 80 | +!4 = !{i32 1} |
| 81 | +!5 = !{!"none"} |
| 82 | +!6 = !{!"uint*"} |
| 83 | +!7 = !{!""} |
0 commit comments