@@ -7,12 +7,11 @@ define <4 x i32> @smull(<4 x i16> %x, <4 x i16> *%y) {
7
7
; CHECK-NEXT: fmov d1, d0
8
8
; CHECK-NEXT: mov w8, #1
9
9
; CHECK-NEXT: movi v0.2d, #0000000000000000
10
- ; CHECK-NEXT: dup v1.4h, v1.h[3]
11
10
; CHECK-NEXT: .LBB0_1: // %l1
12
11
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
13
12
; CHECK-NEXT: ldr d2, [x0]
14
13
; CHECK-NEXT: subs w8, w8, #1
15
- ; CHECK-NEXT: smlal v0.4s, v2.4h, v1.4h
14
+ ; CHECK-NEXT: smlal v0.4s, v2.4h, v1.h[3]
16
15
; CHECK-NEXT: b.eq .LBB0_1
17
16
; CHECK-NEXT: // %bb.2: // %l2
18
17
; CHECK-NEXT: ret
@@ -40,12 +39,11 @@ define <4 x i32> @umull(<4 x i16> %x, <4 x i16> *%y) {
40
39
; CHECK-NEXT: fmov d1, d0
41
40
; CHECK-NEXT: mov w8, #1
42
41
; CHECK-NEXT: movi v0.2d, #0000000000000000
43
- ; CHECK-NEXT: dup v1.4h, v1.h[3]
44
42
; CHECK-NEXT: .LBB1_1: // %l1
45
43
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
46
44
; CHECK-NEXT: ldr d2, [x0]
47
45
; CHECK-NEXT: subs w8, w8, #1
48
- ; CHECK-NEXT: umlal v0.4s, v2.4h, v1.4h
46
+ ; CHECK-NEXT: umlal v0.4s, v2.4h, v1.h[3]
49
47
; CHECK-NEXT: b.eq .LBB1_1
50
48
; CHECK-NEXT: // %bb.2: // %l2
51
49
; CHECK-NEXT: ret
@@ -73,12 +71,11 @@ define <4 x i32> @sqadd(<4 x i32> %x, <4 x i32> *%y) {
73
71
; CHECK-NEXT: mov v1.16b, v0.16b
74
72
; CHECK-NEXT: mov w8, #1
75
73
; CHECK-NEXT: movi v0.2d, #0000000000000000
76
- ; CHECK-NEXT: dup v1.4s, v1.s[3]
77
74
; CHECK-NEXT: .LBB2_1: // %l1
78
75
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
79
76
; CHECK-NEXT: ldr q2, [x0]
80
77
; CHECK-NEXT: subs w8, w8, #1
81
- ; CHECK-NEXT: sqrdmulh v2.4s, v2.4s, v1.4s
78
+ ; CHECK-NEXT: sqrdmulh v2.4s, v2.4s, v1.s[3]
82
79
; CHECK-NEXT: sqadd v0.4s, v0.4s, v2.4s
83
80
; CHECK-NEXT: b.eq .LBB2_1
84
81
; CHECK-NEXT: // %bb.2: // %l2
@@ -107,12 +104,11 @@ define <4 x i32> @sqsub(<4 x i32> %x, <4 x i32> *%y) {
107
104
; CHECK-NEXT: mov v1.16b, v0.16b
108
105
; CHECK-NEXT: mov w8, #1
109
106
; CHECK-NEXT: movi v0.2d, #0000000000000000
110
- ; CHECK-NEXT: dup v1.4s, v1.s[3]
111
107
; CHECK-NEXT: .LBB3_1: // %l1
112
108
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
113
109
; CHECK-NEXT: ldr q2, [x0]
114
110
; CHECK-NEXT: subs w8, w8, #1
115
- ; CHECK-NEXT: sqrdmulh v2.4s, v2.4s, v1.4s
111
+ ; CHECK-NEXT: sqrdmulh v2.4s, v2.4s, v1.s[3]
116
112
; CHECK-NEXT: sqsub v0.4s, v0.4s, v2.4s
117
113
; CHECK-NEXT: b.eq .LBB3_1
118
114
; CHECK-NEXT: // %bb.2: // %l2
@@ -141,12 +137,11 @@ define <4 x i32> @sqdmulh(<4 x i32> %x, <4 x i32> *%y) {
141
137
; CHECK-NEXT: mov v1.16b, v0.16b
142
138
; CHECK-NEXT: mov w8, #1
143
139
; CHECK-NEXT: movi v0.2d, #0000000000000000
144
- ; CHECK-NEXT: dup v1.4s, v1.s[3]
145
140
; CHECK-NEXT: .LBB4_1: // %l1
146
141
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
147
142
; CHECK-NEXT: ldr q2, [x0]
148
143
; CHECK-NEXT: subs w8, w8, #1
149
- ; CHECK-NEXT: sqdmulh v2.4s, v2.4s, v1.4s
144
+ ; CHECK-NEXT: sqdmulh v2.4s, v2.4s, v1.s[3]
150
145
; CHECK-NEXT: add v0.4s, v0.4s, v2.4s
151
146
; CHECK-NEXT: b.eq .LBB4_1
152
147
; CHECK-NEXT: // %bb.2: // %l2
@@ -175,12 +170,11 @@ define <4 x i32> @sqdmull(<4 x i16> %x, <4 x i16> *%y) {
175
170
; CHECK-NEXT: fmov d1, d0
176
171
; CHECK-NEXT: mov w8, #1
177
172
; CHECK-NEXT: movi v0.2d, #0000000000000000
178
- ; CHECK-NEXT: dup v1.4h, v1.h[3]
179
173
; CHECK-NEXT: .LBB5_1: // %l1
180
174
; CHECK-NEXT: // =>This Inner Loop Header: Depth=1
181
175
; CHECK-NEXT: ldr d2, [x0]
182
176
; CHECK-NEXT: subs w8, w8, #1
183
- ; CHECK-NEXT: sqdmull v2.4s, v2.4h, v1.4h
177
+ ; CHECK-NEXT: sqdmull v2.4s, v2.4h, v1.h[3]
184
178
; CHECK-NEXT: add v0.4s, v0.4s, v2.4s
185
179
; CHECK-NEXT: b.eq .LBB5_1
186
180
; CHECK-NEXT: // %bb.2: // %l2
0 commit comments