Skip to content

Commit 812c302

Browse files
author
Thorsten Schütt
authored
[GlobalISel][AArch64] Legalize G_PTR_ADD (#89218)
Fixes the following legalizer failure for a G_PTR_ADD on vectors wider than two elements:
LLVM ERROR: unable to legalize instruction: %275:_(<4 x p0>) = G_PTR_ADD %268:_, %274:_(<4 x s64>) (in function: prepare_for_pass)
1 parent 48b6f4a commit 812c302

File tree

2 files changed: +59 -4 lines changed

llvm/lib/Target/AArch64/GISel/AArch64LegalizerInfo.cpp

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -177,7 +177,9 @@ AArch64LegalizerInfo::AArch64LegalizerInfo(const AArch64Subtarget &ST)
177177

178178
getActionDefinitionsBuilder(G_PTR_ADD)
179179
.legalFor({{p0, s64}, {v2p0, v2s64}})
180-
.clampScalar(1, s64, s64);
180+
.clampScalar(1, s64, s64)
181+
.clampNumElements(0, v2p0, v2p0)
182+
.clampNumElements(1, v2s64, v2s64);
181183

182184
getActionDefinitionsBuilder(G_PTRMASK).legalFor({{p0, s64}});
183185

llvm/test/CodeGen/AArch64/GlobalISel/legalize-ptr-add.mir

Lines changed: 56 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -6,12 +6,65 @@ body: |
66
bb.0.entry:
77
; CHECK-LABEL: name: test_ptr_add_vec_p0
88
; CHECK: [[COPY:%[0-9]+]]:_(<2 x p0>) = COPY $q0
9-
; CHECK: [[COPY1:%[0-9]+]]:_(<2 x s64>) = COPY $q1
10-
; CHECK: [[PTR_ADD:%[0-9]+]]:_(<2 x p0>) = G_PTR_ADD [[COPY]], [[COPY1]](<2 x s64>)
11-
; CHECK: $q0 = COPY [[PTR_ADD]](<2 x p0>)
9+
; CHECK-NEXT: [[COPY1:%[0-9]+]]:_(<2 x s64>) = COPY $q1
10+
; CHECK-NEXT: [[PTR_ADD:%[0-9]+]]:_(<2 x p0>) = G_PTR_ADD [[COPY]], [[COPY1]](<2 x s64>)
11+
; CHECK-NEXT: $q0 = COPY [[PTR_ADD]](<2 x p0>)
1212
%0:_(<2 x p0>) = COPY $q0
1313
%1:_(<2 x s64>) = COPY $q1
1414
%3:_(<2 x p0>) = G_PTR_ADD %0, %1(<2 x s64>)
1515
$q0 = COPY %3(<2 x p0>)
1616
1717
...
18+
---
19+
name: test_ptr_add_vec_4xp0
20+
body: |
21+
bb.0.entry:
22+
; CHECK-LABEL: name: test_ptr_add_vec_4xp0
23+
; CHECK: [[COPY:%[0-9]+]]:_(p0) = COPY $x0
24+
; CHECK-NEXT: [[COPY1:%[0-9]+]]:_(p0) = COPY $x1
25+
; CHECK-NEXT: [[COPY2:%[0-9]+]]:_(p0) = COPY $x2
26+
; CHECK-NEXT: [[COPY3:%[0-9]+]]:_(p0) = COPY $x3
27+
; CHECK-NEXT: [[COPY4:%[0-9]+]]:_(s64) = COPY $x4
28+
; CHECK-NEXT: [[COPY5:%[0-9]+]]:_(s64) = COPY $x5
29+
; CHECK-NEXT: [[COPY6:%[0-9]+]]:_(s64) = COPY $x6
30+
; CHECK-NEXT: [[COPY7:%[0-9]+]]:_(s64) = COPY $x7
31+
; CHECK-NEXT: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x p0>) = G_BUILD_VECTOR [[COPY]](p0), [[COPY1]](p0)
32+
; CHECK-NEXT: [[BUILD_VECTOR1:%[0-9]+]]:_(<2 x p0>) = G_BUILD_VECTOR [[COPY2]](p0), [[COPY3]](p0)
33+
; CHECK-NEXT: [[BUILD_VECTOR2:%[0-9]+]]:_(<2 x s64>) = G_BUILD_VECTOR [[COPY4]](s64), [[COPY5]](s64)
34+
; CHECK-NEXT: [[BUILD_VECTOR3:%[0-9]+]]:_(<2 x s64>) = G_BUILD_VECTOR [[COPY6]](s64), [[COPY7]](s64)
35+
; CHECK-NEXT: [[PTR_ADD:%[0-9]+]]:_(<2 x p0>) = G_PTR_ADD [[BUILD_VECTOR]], [[BUILD_VECTOR2]](<2 x s64>)
36+
; CHECK-NEXT: [[PTR_ADD1:%[0-9]+]]:_(<2 x p0>) = G_PTR_ADD [[BUILD_VECTOR1]], [[BUILD_VECTOR3]](<2 x s64>)
37+
; CHECK-NEXT: %zero:_(s64) = G_CONSTANT i64 0
38+
; CHECK-NEXT: %one:_(s64) = G_CONSTANT i64 1
39+
; CHECK-NEXT: %extract0:_(p0) = G_EXTRACT_VECTOR_ELT [[PTR_ADD]](<2 x p0>), %zero(s64)
40+
; CHECK-NEXT: %extract1:_(p0) = G_EXTRACT_VECTOR_ELT [[PTR_ADD]](<2 x p0>), %one(s64)
41+
; CHECK-NEXT: %extract2:_(p0) = G_EXTRACT_VECTOR_ELT [[PTR_ADD1]](<2 x p0>), %zero(s64)
42+
; CHECK-NEXT: %extract3:_(p0) = G_EXTRACT_VECTOR_ELT [[PTR_ADD1]](<2 x p0>), %one(s64)
43+
; CHECK-NEXT: $x0 = COPY %extract0(p0)
44+
; CHECK-NEXT: $x1 = COPY %extract1(p0)
45+
; CHECK-NEXT: $x2 = COPY %extract2(p0)
46+
; CHECK-NEXT: $x3 = COPY %extract3(p0)
47+
%0:_(p0) = COPY $x0
48+
%1:_(p0) = COPY $x1
49+
%2:_(p0) = COPY $x2
50+
%3:_(p0) = COPY $x3
51+
%4:_(s64) = COPY $x4
52+
%5:_(s64) = COPY $x5
53+
%6:_(s64) = COPY $x6
54+
%7:_(s64) = COPY $x7
55+
%ptr:_(<4 x p0>) = G_BUILD_VECTOR %0(p0), %1(p0), %2(p0), %3(p0)
56+
%add:_(<4 x s64>) = G_BUILD_VECTOR %4(s64), %5(s64), %6(s64), %7(s64)
57+
%res:_(<4 x p0>) = G_PTR_ADD %ptr, %add(<4 x s64>)
58+
%zero:_(s64) = G_CONSTANT i64 0
59+
%one:_(s64) = G_CONSTANT i64 1
60+
%two:_(s64) = G_CONSTANT i64 2
61+
%three:_(s64) = G_CONSTANT i64 3
62+
%extract0:_(p0) = G_EXTRACT_VECTOR_ELT %res(<4 x p0>), %zero(s64)
63+
%extract1:_(p0) = G_EXTRACT_VECTOR_ELT %res(<4 x p0>), %one(s64)
64+
%extract2:_(p0) = G_EXTRACT_VECTOR_ELT %res(<4 x p0>), %two(s64)
65+
%extract3:_(p0) = G_EXTRACT_VECTOR_ELT %res(<4 x p0>), %three(s64)
66+
$x0 = COPY %extract0(p0)
67+
$x1 = COPY %extract1(p0)
68+
$x2 = COPY %extract2(p0)
69+
$x3 = COPY %extract3(p0)
70+
...

0 commit comments

Comments
 (0)