|
| 1 | +; RUN: sycl-post-link --device-globals --split=source -S %s -o %t.files.table |
| 2 | +; RUN: FileCheck %s -input-file=%t.files_0.ll --check-prefix CHECK-MOD0 |
| 3 | +; RUN: FileCheck %s -input-file=%t.files_1.ll --check-prefix CHECK-MOD1 |
| 4 | + |
| 5 | +; This test is intended to check that sycl-post-link generates no errors |
| 6 | +; when a device global variable with the 'device_image_scope' property |
| 7 | +; is used in many kernels grouped to one module. |
| 8 | + |
| 9 | +target datalayout = "e-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-n8:16:32:64" |
| 10 | +target triple = "spir64-unknown-unknown" |
| 11 | + |
| 12 | +%"class.cl::sycl::ext::oneapi::device_global" = type { i32 } |
| 13 | +%"class.cl::sycl::detail::accessor_common" = type { i8 } |
| 14 | + |
| 15 | +$_ZTSZ7kernel1RN2cl4sycl5queueEEUlvE_ = comdat any |
| 16 | +$_ZTSZ7kernel2RN2cl4sycl5queueEEUlvE_ = comdat any |
| 17 | +$_ZTSZ7kernel3RN2cl4sycl5queueEEUlvE_ = comdat any |
| 18 | +$_ZTSZ7kernel4RN2cl4sycl5queueEEUlvE_ = comdat any |
| 19 | + |
| 20 | +$dg_int2 = comdat any |
| 21 | +@dg_int2 = linkonce_odr dso_local addrspace(1) constant %"class.cl::sycl::ext::oneapi::device_global" zeroinitializer, comdat, align 4 #0 |
| 22 | +; CHECK-MOD0: @dg_int2 = linkonce_odr dso_local addrspace(1) constant %"class.cl::sycl::ext::oneapi::device_global" zeroinitializer, comdat, align 4 |
| 23 | +; CHECK-MOD1-NOT: @dg_int2 |
| 24 | + |
| 25 | +; Third kernel that uses no device-global variables |
| 26 | +define weak_odr dso_local spir_kernel void @_ZTSZ7kernel3RN2cl4sycl5queueEEUlvE_() #3 comdat !kernel_arg_buffer_location !6 { |
| 27 | +entry: |
| 28 | + ret void |
| 29 | +} |
| 30 | + |
| 31 | +; Function Attrs: convergent mustprogress noinline norecurse optnone |
| 32 | +define weak_odr dso_local spir_kernel void @_ZTSZ7kernel4RN2cl4sycl5queueEEUlvE_() #2 comdat !kernel_arg_buffer_location !6 { |
| 33 | +entry: |
| 34 | + %0 = alloca %"class.cl::sycl::detail::accessor_common", align 1 |
| 35 | + %1 = addrspacecast %"class.cl::sycl::detail::accessor_common"* %0 to %"class.cl::sycl::detail::accessor_common" addrspace(4)* |
| 36 | + call spir_func void @_ZZ7kernel1RN2cl4sycl5queueEENKUlvE_clEv(%"class.cl::sycl::detail::accessor_common" addrspace(4)* align 1 dereferenceable_or_null(1) %1) #4 |
| 37 | + ret void |
| 38 | +} |
| 39 | + |
| 40 | +; Function Attrs: convergent mustprogress noinline norecurse optnone |
| 41 | +define weak_odr dso_local spir_kernel void @_ZTSZ7kernel1RN2cl4sycl5queueEEUlvE_() #2 comdat !kernel_arg_buffer_location !6 { |
| 42 | +entry: |
| 43 | + %0 = alloca %"class.cl::sycl::detail::accessor_common", align 1 |
| 44 | + %1 = addrspacecast %"class.cl::sycl::detail::accessor_common"* %0 to %"class.cl::sycl::detail::accessor_common" addrspace(4)* |
| 45 | + call spir_func void @_ZZ7kernel1RN2cl4sycl5queueEENKUlvE_clEv(%"class.cl::sycl::detail::accessor_common" addrspace(4)* align 1 dereferenceable_or_null(1) %1) #4 |
| 46 | + ret void |
| 47 | +} |
| 48 | + |
| 49 | +; Function Attrs: convergent mustprogress noinline norecurse nounwind optnone |
| 50 | +define internal spir_func void @_ZZ7kernel1RN2cl4sycl5queueEENKUlvE_clEv(%"class.cl::sycl::detail::accessor_common" addrspace(4)* align 1 dereferenceable_or_null(1) %this) #1 align 2 { |
| 51 | +entry: |
| 52 | + %this.addr = alloca %"class.cl::sycl::detail::accessor_common" addrspace(4)*, align 8 |
| 53 | + %this.addr.ascast = addrspacecast %"class.cl::sycl::detail::accessor_common" addrspace(4)** %this.addr to %"class.cl::sycl::detail::accessor_common" addrspace(4)* addrspace(4)* |
| 54 | + store %"class.cl::sycl::detail::accessor_common" addrspace(4)* %this, %"class.cl::sycl::detail::accessor_common" addrspace(4)* addrspace(4)* %this.addr.ascast, align 8 |
| 55 | + %this1 = load %"class.cl::sycl::detail::accessor_common" addrspace(4)*, %"class.cl::sycl::detail::accessor_common" addrspace(4)* addrspace(4)* %this.addr.ascast, align 8 |
| 56 | + call spir_func void @_Z14kernel1_level1v() #4 |
| 57 | + ret void |
| 58 | +} |
| 59 | + |
| 60 | +; Function Attrs: convergent mustprogress noinline norecurse nounwind optnone |
| 61 | +define dso_local spir_func void @_Z14kernel1_level1v() #1 { |
| 62 | +entry: |
| 63 | + %dg_int_ptr = alloca %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)*, align 8 |
| 64 | + %dg_int_ptr.ascast = addrspacecast %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)** %dg_int_ptr to %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* addrspace(4)* |
| 65 | + store %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* addrspacecast (%"class.cl::sycl::ext::oneapi::device_global" addrspace(1)* @dg_int2 to %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)*), %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* addrspace(4)* %dg_int_ptr.ascast, align 8 |
| 66 | + %0 = load %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)*, %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* addrspace(4)* %dg_int_ptr.ascast, align 8 |
| 67 | + %call = call spir_func align 4 dereferenceable(4) i32 addrspace(4)* @_ZNK2cl4sycl3ext6oneapi13device_globalIiJNS2_8PropertyIPKcXadsoS5_L_ZL5Name1EEEXadsoS5_L_ZL6Value1EEEEENS4_I11host_accessXadsoS5_L_ZL5Name2EEELS8_1EEENS4_IS6_XadsoS5_L_ZL5Name3EEEXadsoS5_L_ZL6Value3EEEEENS4_IS6_XadsoS5_L_ZL5Name4EEEXadsoS5_L_ZL6Value4EEEEEEE3getEv(%"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* align 4 dereferenceable_or_null(4) %0) #6 |
| 68 | + ret void |
| 69 | +} |
| 70 | + |
| 71 | +; Function Attrs: convergent mustprogress noinline norecurse nounwind optnone |
| 72 | +define internal spir_func align 4 dereferenceable(4) i32 addrspace(4)* @_ZNK2cl4sycl3ext6oneapi13device_globalIiJNS2_8PropertyIPKcXadsoS5_L_ZL5Name1EEEXadsoS5_L_ZL6Value1EEEEENS4_I11host_accessXadsoS5_L_ZL5Name2EEELS8_1EEENS4_IS6_XadsoS5_L_ZL5Name3EEEXadsoS5_L_ZL6Value3EEEEENS4_IS6_XadsoS5_L_ZL5Name4EEEXadsoS5_L_ZL6Value4EEEEEEE3getEv(%"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* align 4 dereferenceable_or_null(4) %this) #1 align 2 { |
| 73 | +entry: |
| 74 | + %retval = alloca i32 addrspace(4)*, align 8 |
| 75 | + %this.addr = alloca %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)*, align 8 |
| 76 | + %retval.ascast = addrspacecast i32 addrspace(4)** %retval to i32 addrspace(4)* addrspace(4)* |
| 77 | + %this.addr.ascast = addrspacecast %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)** %this.addr to %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* addrspace(4)* |
| 78 | + store %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* %this, %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* addrspace(4)* %this.addr.ascast, align 8 |
| 79 | + %this1 = load %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)*, %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* addrspace(4)* %this.addr.ascast, align 8 |
| 80 | + %val = getelementptr inbounds %"class.cl::sycl::ext::oneapi::device_global", %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* %this1, i32 0, i32 0 |
| 81 | + ret i32 addrspace(4)* %val |
| 82 | +} |
| 83 | + |
| 84 | +; Function Attrs: convergent mustprogress noinline norecurse optnone |
| 85 | +define weak_odr dso_local spir_kernel void @_ZTSZ7kernel2RN2cl4sycl5queueEEUlvE_() #2 comdat !kernel_arg_buffer_location !6 { |
| 86 | +entry: |
| 87 | + %0 = alloca %"class.cl::sycl::detail::accessor_common", align 1 |
| 88 | + %1 = addrspacecast %"class.cl::sycl::detail::accessor_common"* %0 to %"class.cl::sycl::detail::accessor_common" addrspace(4)* |
| 89 | + call spir_func void @_ZZ7kernel2RN2cl4sycl5queueEENKUlvE_clEv(%"class.cl::sycl::detail::accessor_common" addrspace(4)* align 1 dereferenceable_or_null(1) %1) #4 |
| 90 | + ret void |
| 91 | +} |
| 92 | + |
| 93 | +; Function Attrs: convergent mustprogress noinline norecurse nounwind optnone |
| 94 | +define internal spir_func void @_ZZ7kernel2RN2cl4sycl5queueEENKUlvE_clEv(%"class.cl::sycl::detail::accessor_common" addrspace(4)* align 1 dereferenceable_or_null(1) %this) #1 align 2 { |
| 95 | +entry: |
| 96 | + %this.addr = alloca %"class.cl::sycl::detail::accessor_common" addrspace(4)*, align 8 |
| 97 | + %this.addr.ascast = addrspacecast %"class.cl::sycl::detail::accessor_common" addrspace(4)** %this.addr to %"class.cl::sycl::detail::accessor_common" addrspace(4)* addrspace(4)* |
| 98 | + store %"class.cl::sycl::detail::accessor_common" addrspace(4)* %this, %"class.cl::sycl::detail::accessor_common" addrspace(4)* addrspace(4)* %this.addr.ascast, align 8 |
| 99 | + %this1 = load %"class.cl::sycl::detail::accessor_common" addrspace(4)*, %"class.cl::sycl::detail::accessor_common" addrspace(4)* addrspace(4)* %this.addr.ascast, align 8 |
| 100 | + %call = call spir_func align 4 dereferenceable(4) i32 addrspace(4)* @_ZNK2cl4sycl3ext6oneapi13device_globalIiJNS2_8PropertyIPKcXadsoS5_L_ZL5Name1EEEXadsoS5_L_ZL6Value1EEEEENS4_I11host_accessXadsoS5_L_ZL5Name2EEELS8_1EEENS4_IS6_XadsoS5_L_ZL5Name3EEEXadsoS5_L_ZL6Value3EEEEENS4_IS6_XadsoS5_L_ZL5Name4EEEXadsoS5_L_ZL6Value4EEEEEEE3getEv.2(%"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* align 4 dereferenceable_or_null(4) addrspacecast (%"class.cl::sycl::ext::oneapi::device_global" addrspace(1)* @dg_int2 to %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)*)) #5 |
| 101 | + ret void |
| 102 | +} |
| 103 | + |
| 104 | +; Function Attrs: convergent mustprogress noinline norecurse nounwind optnone |
| 105 | +define internal spir_func align 4 dereferenceable(4) i32 addrspace(4)* @_ZNK2cl4sycl3ext6oneapi13device_globalIiJNS2_8PropertyIPKcXadsoS5_L_ZL5Name1EEEXadsoS5_L_ZL6Value1EEEEENS4_I11host_accessXadsoS5_L_ZL5Name2EEELS8_1EEENS4_IS6_XadsoS5_L_ZL5Name3EEEXadsoS5_L_ZL6Value3EEEEENS4_IS6_XadsoS5_L_ZL5Name4EEEXadsoS5_L_ZL6Value4EEEEEEE3getEv.2(%"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* align 4 dereferenceable_or_null(4) %this) #1 align 2 { |
| 106 | +entry: |
| 107 | + %retval = alloca i32 addrspace(4)*, align 8 |
| 108 | + %this.addr = alloca %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)*, align 8 |
| 109 | + %retval.ascast = addrspacecast i32 addrspace(4)** %retval to i32 addrspace(4)* addrspace(4)* |
| 110 | + %this.addr.ascast = addrspacecast %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)** %this.addr to %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* addrspace(4)* |
| 111 | + store %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* %this, %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* addrspace(4)* %this.addr.ascast, align 8 |
| 112 | + %this1 = load %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)*, %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* addrspace(4)* %this.addr.ascast, align 8 |
| 113 | + %val = getelementptr inbounds %"class.cl::sycl::ext::oneapi::device_global", %"class.cl::sycl::ext::oneapi::device_global" addrspace(4)* %this1, i32 0, i32 0 |
| 114 | + ret i32 addrspace(4)* %val |
| 115 | +} |
| 116 | + |
| 117 | +attributes #0 = { "sycl-unique-id"="dg_int2" "device_image_scope"="true" "host_access"="1" "implement_in_csr"="true" "init_mode"="0" "sycl-device-global-size"="4" } |
| 118 | +attributes #1 = { convergent mustprogress noinline norecurse nounwind optnone "frame-pointer"="all" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" } |
| 119 | +attributes #2 = { convergent mustprogress noinline norecurse optnone "frame-pointer"="all" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "sycl-module-id"="test_global_variable_1.cpp" "uniform-work-group-size"="true" } |
| 120 | +attributes #3 = { convergent mustprogress noinline norecurse optnone "frame-pointer"="all" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "sycl-module-id"="test_global_variable_main.cpp" "uniform-work-group-size"="true" } |
| 121 | +attributes #4 = { convergent } |
| 122 | +attributes #5 = { convergent nounwind } |
| 123 | +attributes #6 = { nobuiltin allocsize(0) "frame-pointer"="none" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" } |
| 124 | + |
| 125 | +!llvm.dependent-libraries = !{!0} |
| 126 | +!opencl.spir.version = !{!1} |
| 127 | +!spirv.Source = !{!2} |
| 128 | +!llvm.ident = !{!3} |
| 129 | +!llvm.module.flags = !{!4, !5} |
| 130 | + |
| 131 | +!0 = !{!"libcpmt"} |
| 132 | +!1 = !{i32 1, i32 2} |
| 133 | +!2 = !{i32 4, i32 100000} |
| 134 | +!3 = !{!"clang version 14.0.0"} |
| 135 | +!4 = !{i32 1, !"wchar_size", i32 2} |
| 136 | +!5 = !{i32 7, !"frame-pointer", i32 2} |
| 137 | +!6 = !{} |
0 commit comments