|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5 |
| 2 | +; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -passes=amdgpu-promote-alloca < %s | FileCheck %s |
| 3 | + |
| 4 | +; Check that invalid IR is not produced on a vector typed |
| 5 | +; getelementptr with a scalar alloca pointer base. |
| 6 | + |
| 7 | +define amdgpu_kernel void @scalar_alloca_ptr_with_vector_gep_offset() { |
| 8 | +; CHECK-LABEL: define amdgpu_kernel void @scalar_alloca_ptr_with_vector_gep_offset() { |
| 9 | +; CHECK-NEXT: [[BB:.*:]] |
| 10 | +; CHECK-NEXT: [[ALLOCA:%.*]] = alloca i32, align 4, addrspace(5) |
| 11 | +; CHECK-NEXT: [[GETELEMENTPTR:%.*]] = getelementptr inbounds i8, ptr addrspace(5) [[ALLOCA]], <4 x i64> <i64 0, i64 1, i64 2, i64 3> |
| 12 | +; CHECK-NEXT: [[EXTRACTELEMENT:%.*]] = extractelement <4 x ptr addrspace(5)> [[GETELEMENTPTR]], i64 0 |
| 13 | +; CHECK-NEXT: store i32 0, ptr addrspace(5) [[EXTRACTELEMENT]], align 4 |
| 14 | +; CHECK-NEXT: ret void |
| 15 | +; |
| 16 | +bb: |
| 17 | + %alloca = alloca i32, align 4, addrspace(5) |
| 18 | + %getelementptr = getelementptr inbounds i8, ptr addrspace(5) %alloca, <4 x i64> <i64 0, i64 1, i64 2, i64 3> |
| 19 | + %extractelement = extractelement <4 x ptr addrspace(5)> %getelementptr, i64 0 |
| 20 | + store i32 0, ptr addrspace(5) %extractelement |
| 21 | + ret void |
| 22 | +} |
| 23 | + |
| 24 | +define amdgpu_kernel void @scalar_alloca_ptr_with_vector_gep_offset_select(i1 %cond) { |
| 25 | +; CHECK-LABEL: define amdgpu_kernel void @scalar_alloca_ptr_with_vector_gep_offset_select( |
| 26 | +; CHECK-SAME: i1 [[COND:%.*]]) { |
| 27 | +; CHECK-NEXT: [[BB:.*:]] |
| 28 | +; CHECK-NEXT: [[ALLOCA:%.*]] = alloca i32, align 4, addrspace(5) |
| 29 | +; CHECK-NEXT: [[GETELEMENTPTR0:%.*]] = getelementptr inbounds i8, ptr addrspace(5) [[ALLOCA]], <4 x i64> <i64 0, i64 1, i64 2, i64 3> |
| 30 | +; CHECK-NEXT: [[GETELEMENTPTR1:%.*]] = getelementptr inbounds i8, ptr addrspace(5) [[ALLOCA]], <4 x i64> <i64 3, i64 2, i64 1, i64 0> |
| 31 | +; CHECK-NEXT: [[SELECT:%.*]] = select i1 [[COND]], <4 x ptr addrspace(5)> [[GETELEMENTPTR0]], <4 x ptr addrspace(5)> [[GETELEMENTPTR1]] |
| 32 | +; CHECK-NEXT: [[EXTRACTELEMENT:%.*]] = extractelement <4 x ptr addrspace(5)> [[SELECT]], i64 1 |
| 33 | +; CHECK-NEXT: store i32 0, ptr addrspace(5) [[EXTRACTELEMENT]], align 4 |
| 34 | +; CHECK-NEXT: ret void |
| 35 | +; |
| 36 | +bb: |
| 37 | + %alloca = alloca i32, align 4, addrspace(5) |
| 38 | + %getelementptr0 = getelementptr inbounds i8, ptr addrspace(5) %alloca, <4 x i64> <i64 0, i64 1, i64 2, i64 3> |
| 39 | + %getelementptr1 = getelementptr inbounds i8, ptr addrspace(5) %alloca, <4 x i64> <i64 3, i64 2, i64 1, i64 0> |
| 40 | + %select = select i1 %cond, <4 x ptr addrspace(5)> %getelementptr0, <4 x ptr addrspace(5)> %getelementptr1 |
| 41 | + %extractelement = extractelement <4 x ptr addrspace(5)> %select, i64 1 |
| 42 | + store i32 0, ptr addrspace(5) %extractelement |
| 43 | + ret void |
| 44 | +} |
0 commit comments