@@ -32,23 +32,23 @@ define <4 x i32> @load_array_vec_test() #0 {
32
32
; CHECK-NEXT: [[TMP6:%.*]] = load i32, ptr addrspace(3) [[TMP5]], align 4
33
33
; CHECK-NEXT: [[TMP7:%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 3) to ptr addrspace(3)
34
34
; CHECK-NEXT: [[TMP8:%.*]] = load i32, ptr addrspace(3) [[TMP7]], align 4
35
- ; CHECK-NEXT: [[TMP11 :%.*]] = bitcast ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 1) to ptr addrspace(3)
36
- ; CHECK-NEXT: [[TMP12 :%.*]] = load i32, ptr addrspace(3) [[TMP11 ]], align 4
37
- ; CHECK-NEXT: [[DOTI12 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 1), i32 1) to ptr addrspace(3)
38
- ; CHECK-NEXT: [[DOTI13 :%.*]] = load i32, ptr addrspace(3) [[DOTI12 ]], align 4
39
- ; CHECK-NEXT: [[DOTI24 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 1), i32 2) to ptr addrspace(3)
40
- ; CHECK-NEXT: [[DOTI25 :%.*]] = load i32, ptr addrspace(3) [[DOTI24 ]], align 4
41
- ; CHECK-NEXT: [[DOTI36 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 1), i32 3) to ptr addrspace(3)
42
- ; CHECK-NEXT: [[DOTI37 :%.*]] = load i32, ptr addrspace(3) [[DOTI36 ]], align 4
43
- ; CHECK-NEXT: [[DOTI08 :%.*]] = add i32 [[TMP2]], [[TMP12 ]]
44
- ; CHECK-NEXT: [[DOTI19 :%.*]] = add i32 [[TMP4]], [[DOTI13 ]]
45
- ; CHECK-NEXT: [[DOTI210 :%.*]] = add i32 [[TMP6]], [[DOTI25 ]]
46
- ; CHECK-NEXT: [[DOTI311 :%.*]] = add i32 [[TMP8]], [[DOTI37 ]]
47
- ; CHECK-NEXT: [[DOTUPTO015 :%.*]] = insertelement <4 x i32> poison, i32 [[DOTI08 ]], i32 0
48
- ; CHECK-NEXT: [[DOTUPTO116 :%.*]] = insertelement <4 x i32> [[DOTUPTO015 ]], i32 [[DOTI19 ]], i32 1
49
- ; CHECK-NEXT: [[DOTUPTO217 :%.*]] = insertelement <4 x i32> [[DOTUPTO116 ]], i32 [[DOTI210 ]], i32 2
50
- ; CHECK-NEXT: [[TMP16 :%.*]] = insertelement <4 x i32> [[DOTUPTO217 ]], i32 [[DOTI311 ]], i32 3
51
- ; CHECK-NEXT: ret <4 x i32> [[TMP16 ]]
35
+ ; CHECK-NEXT: [[TMP9 :%.*]] = bitcast ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0 , i32 1) to ptr addrspace(3)
36
+ ; CHECK-NEXT: [[TMP10 :%.*]] = load i32, ptr addrspace(3) [[TMP9 ]], align 4
37
+ ; CHECK-NEXT: [[TMP11 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0 , i32 1), i32 1) to ptr addrspace(3)
38
+ ; CHECK-NEXT: [[TMP12 :%.*]] = load i32, ptr addrspace(3) [[TMP11 ]], align 4
39
+ ; CHECK-NEXT: [[TMP13 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0 , i32 1), i32 2) to ptr addrspace(3)
40
+ ; CHECK-NEXT: [[TMP14 :%.*]] = load i32, ptr addrspace(3) [[TMP13 ]], align 4
41
+ ; CHECK-NEXT: [[TMP15 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0 , i32 1), i32 3) to ptr addrspace(3)
42
+ ; CHECK-NEXT: [[TMP16 :%.*]] = load i32, ptr addrspace(3) [[TMP15 ]], align 4
43
+ ; CHECK-NEXT: [[DOTI05 :%.*]] = add i32 [[TMP2]], [[TMP10 ]]
44
+ ; CHECK-NEXT: [[DOTI16 :%.*]] = add i32 [[TMP4]], [[TMP12 ]]
45
+ ; CHECK-NEXT: [[DOTI27 :%.*]] = add i32 [[TMP6]], [[TMP14 ]]
46
+ ; CHECK-NEXT: [[DOTI38 :%.*]] = add i32 [[TMP8]], [[TMP16 ]]
47
+ ; CHECK-NEXT: [[DOTUPTO01215 :%.*]] = insertelement <4 x i32> poison, i32 [[DOTI05 ]], i32 0
48
+ ; CHECK-NEXT: [[DOTUPTO11316 :%.*]] = insertelement <4 x i32> [[DOTUPTO01215 ]], i32 [[DOTI16 ]], i32 1
49
+ ; CHECK-NEXT: [[DOTUPTO21417 :%.*]] = insertelement <4 x i32> [[DOTUPTO11316 ]], i32 [[DOTI27 ]], i32 2
50
+ ; CHECK-NEXT: [[TMP17 :%.*]] = insertelement <4 x i32> [[DOTUPTO21417 ]], i32 [[DOTI38 ]], i32 3
51
+ ; CHECK-NEXT: ret <4 x i32> [[TMP17 ]]
52
52
;
53
53
%1 = load <4 x i32 >, <4 x i32 > addrspace (3 )* getelementptr inbounds ([2 x <4 x i32 >], [2 x <4 x i32 >] addrspace (3 )* @"arrayofVecData" , i32 0 , i32 0 ), align 4
54
54
%2 = load <4 x i32 >, <4 x i32 > addrspace (3 )* getelementptr inbounds ([2 x <4 x i32 >], [2 x <4 x i32 >] addrspace (3 )* @"arrayofVecData" , i32 0 , i32 1 ), align 4
@@ -81,23 +81,19 @@ define <4 x i32> @load_vec_test() #0 {
81
81
define <4 x i32 > @load_static_array_of_vec_test (i32 %index ) #0 {
82
82
; CHECK-LABEL: define <4 x i32> @load_static_array_of_vec_test(
83
83
; CHECK-SAME: i32 [[INDEX:%.*]]) #[[ATTR0]] {
84
- ; CHECK-NEXT: [[DOTFLAT:%.*]] = getelementptr inbounds [12 x i32], ptr @staticArrayOfVecData.scalarized.1dim, i32 [[INDEX]]
85
- ; CHECK-NEXT: [[TMP1:%.*]] = bitcast ptr [[DOTFLAT]] to ptr
86
- ; CHECK-NEXT: [[TMP2:%.*]] = load i32, ptr [[TMP1]], align 4
87
- ; CHECK-NEXT: [[TMP3:%.*]] = bitcast ptr [[DOTFLAT]] to ptr
88
- ; CHECK-NEXT: [[DOTFLAT_I1:%.*]] = getelementptr i32, ptr [[TMP3]], i32 1
89
- ; CHECK-NEXT: [[DOTI1:%.*]] = load i32, ptr [[DOTFLAT_I1]], align 4
90
- ; CHECK-NEXT: [[TMP4:%.*]] = bitcast ptr [[DOTFLAT]] to ptr
91
- ; CHECK-NEXT: [[DOTFLAT_I2:%.*]] = getelementptr i32, ptr [[TMP4]], i32 2
92
- ; CHECK-NEXT: [[DOTI2:%.*]] = load i32, ptr [[DOTFLAT_I2]], align 4
93
- ; CHECK-NEXT: [[TMP5:%.*]] = bitcast ptr [[DOTFLAT]] to ptr
94
- ; CHECK-NEXT: [[DOTFLAT_I3:%.*]] = getelementptr i32, ptr [[TMP5]], i32 3
95
- ; CHECK-NEXT: [[DOTI3:%.*]] = load i32, ptr [[DOTFLAT_I3]], align 4
96
- ; CHECK-NEXT: [[DOTUPTO0:%.*]] = insertelement <4 x i32> poison, i32 [[TMP2]], i32 0
97
- ; CHECK-NEXT: [[DOTUPTO1:%.*]] = insertelement <4 x i32> [[DOTUPTO0]], i32 [[DOTI1]], i32 1
98
- ; CHECK-NEXT: [[DOTUPTO2:%.*]] = insertelement <4 x i32> [[DOTUPTO1]], i32 [[DOTI2]], i32 2
99
- ; CHECK-NEXT: [[TMP6:%.*]] = insertelement <4 x i32> [[DOTUPTO2]], i32 [[DOTI3]], i32 3
100
- ; CHECK-NEXT: ret <4 x i32> [[TMP6]]
84
+ ; CHECK-NEXT: [[DOTFLAT:%.*]] = getelementptr inbounds [12 x i32], ptr @staticArrayOfVecData.scalarized.1dim, i32 0, i32 [[INDEX]]
85
+ ; CHECK-NEXT: [[DOTI0:%.*]] = load i32, ptr [[DOTFLAT]], align 4
86
+ ; CHECK-NEXT: [[DOTFLAT_I1:%.*]] = getelementptr i32, ptr [[DOTFLAT]], i32 1
87
+ ; CHECK-NEXT: [[DOTI1:%.*]] = load i32, ptr [[DOTFLAT_I1]], align 4
88
+ ; CHECK-NEXT: [[DOTFLAT_I2:%.*]] = getelementptr i32, ptr [[DOTFLAT]], i32 2
89
+ ; CHECK-NEXT: [[DOTI2:%.*]] = load i32, ptr [[DOTFLAT_I2]], align 4
90
+ ; CHECK-NEXT: [[DOTFLAT_I3:%.*]] = getelementptr i32, ptr [[DOTFLAT]], i32 3
91
+ ; CHECK-NEXT: [[DOTI3:%.*]] = load i32, ptr [[DOTFLAT_I3]], align 4
92
+ ; CHECK-NEXT: [[DOTUPTO01:%.*]] = insertelement <4 x i32> poison, i32 [[DOTI0]], i32 0
93
+ ; CHECK-NEXT: [[DOTUPTO12:%.*]] = insertelement <4 x i32> [[DOTUPTO01]], i32 [[DOTI1]], i32 1
94
+ ; CHECK-NEXT: [[DOTUPTO23:%.*]] = insertelement <4 x i32> [[DOTUPTO12]], i32 [[DOTI2]], i32 2
95
+ ; CHECK-NEXT: [[TMP1:%.*]] = insertelement <4 x i32> [[DOTUPTO23]], i32 [[DOTI3]], i32 3
96
+ ; CHECK-NEXT: ret <4 x i32> [[TMP1]]
101
97
;
102
98
%3 = getelementptr inbounds [3 x <4 x i32 >], [3 x <4 x i32 >]* @staticArrayOfVecData , i32 0 , i32 %index
103
99
%4 = load <4 x i32 >, <4 x i32 >* %3 , align 4
@@ -115,23 +111,23 @@ define <4 x i32> @multid_load_test() #0 {
115
111
; CHECK-NEXT: [[TMP6:%.*]] = load i32, ptr addrspace(3) [[TMP5]], align 4
116
112
; CHECK-NEXT: [[TMP7:%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @groushared2dArrayofVectors.scalarized.1dim, i32 3) to ptr addrspace(3)
117
113
; CHECK-NEXT: [[TMP8:%.*]] = load i32, ptr addrspace(3) [[TMP7]], align 4
118
- ; CHECK-NEXT: [[TMP11 :%.*]] = bitcast ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors.scalarized.1dim, i32 1) to ptr addrspace(3)
119
- ; CHECK-NEXT: [[TMP12 :%.*]] = load i32, ptr addrspace(3) [[TMP11 ]], align 4
120
- ; CHECK-NEXT: [[DOTI12 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors.scalarized.1dim, i32 1), i32 1) to ptr addrspace(3)
121
- ; CHECK-NEXT: [[DOTI13 :%.*]] = load i32, ptr addrspace(3) [[DOTI12 ]], align 4
122
- ; CHECK-NEXT: [[DOTI24 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors.scalarized.1dim, i32 1), i32 2) to ptr addrspace(3)
123
- ; CHECK-NEXT: [[DOTI25 :%.*]] = load i32, ptr addrspace(3) [[DOTI24 ]], align 4
124
- ; CHECK-NEXT: [[DOTI36 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors.scalarized.1dim, i32 1), i32 3) to ptr addrspace(3)
125
- ; CHECK-NEXT: [[DOTI37 :%.*]] = load i32, ptr addrspace(3) [[DOTI36 ]], align 4
126
- ; CHECK-NEXT: [[DOTI08 :%.*]] = add i32 [[TMP2]], [[TMP12 ]]
127
- ; CHECK-NEXT: [[DOTI19 :%.*]] = add i32 [[TMP4]], [[DOTI13 ]]
128
- ; CHECK-NEXT: [[DOTI210 :%.*]] = add i32 [[TMP6]], [[DOTI25 ]]
129
- ; CHECK-NEXT: [[DOTI311 :%.*]] = add i32 [[TMP8]], [[DOTI37 ]]
130
- ; CHECK-NEXT: [[DOTUPTO015 :%.*]] = insertelement <4 x i32> poison, i32 [[DOTI08 ]], i32 0
131
- ; CHECK-NEXT: [[DOTUPTO116 :%.*]] = insertelement <4 x i32> [[DOTUPTO015 ]], i32 [[DOTI19 ]], i32 1
132
- ; CHECK-NEXT: [[DOTUPTO217 :%.*]] = insertelement <4 x i32> [[DOTUPTO116 ]], i32 [[DOTI210 ]], i32 2
133
- ; CHECK-NEXT: [[TMP16 :%.*]] = insertelement <4 x i32> [[DOTUPTO217 ]], i32 [[DOTI311 ]], i32 3
134
- ; CHECK-NEXT: ret <4 x i32> [[TMP16 ]]
114
+ ; CHECK-NEXT: [[TMP9 :%.*]] = bitcast ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors.scalarized.1dim, i32 0 , i32 1) to ptr addrspace(3)
115
+ ; CHECK-NEXT: [[TMP10 :%.*]] = load i32, ptr addrspace(3) [[TMP9 ]], align 4
116
+ ; CHECK-NEXT: [[TMP11 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors.scalarized.1dim, i32 0 , i32 1), i32 1) to ptr addrspace(3)
117
+ ; CHECK-NEXT: [[TMP12 :%.*]] = load i32, ptr addrspace(3) [[TMP11 ]], align 4
118
+ ; CHECK-NEXT: [[TMP13 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors.scalarized.1dim, i32 0 , i32 1), i32 2) to ptr addrspace(3)
119
+ ; CHECK-NEXT: [[TMP14 :%.*]] = load i32, ptr addrspace(3) [[TMP13 ]], align 4
120
+ ; CHECK-NEXT: [[TMP15 :%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors.scalarized.1dim, i32 0 , i32 1), i32 3) to ptr addrspace(3)
121
+ ; CHECK-NEXT: [[TMP16 :%.*]] = load i32, ptr addrspace(3) [[TMP15 ]], align 4
122
+ ; CHECK-NEXT: [[DOTI05 :%.*]] = add i32 [[TMP2]], [[TMP10 ]]
123
+ ; CHECK-NEXT: [[DOTI16 :%.*]] = add i32 [[TMP4]], [[TMP12 ]]
124
+ ; CHECK-NEXT: [[DOTI27 :%.*]] = add i32 [[TMP6]], [[TMP14 ]]
125
+ ; CHECK-NEXT: [[DOTI38 :%.*]] = add i32 [[TMP8]], [[TMP16 ]]
126
+ ; CHECK-NEXT: [[DOTUPTO01215 :%.*]] = insertelement <4 x i32> poison, i32 [[DOTI05 ]], i32 0
127
+ ; CHECK-NEXT: [[DOTUPTO11316 :%.*]] = insertelement <4 x i32> [[DOTUPTO01215 ]], i32 [[DOTI16 ]], i32 1
128
+ ; CHECK-NEXT: [[DOTUPTO21417 :%.*]] = insertelement <4 x i32> [[DOTUPTO11316 ]], i32 [[DOTI27 ]], i32 2
129
+ ; CHECK-NEXT: [[TMP17 :%.*]] = insertelement <4 x i32> [[DOTUPTO21417 ]], i32 [[DOTI38 ]], i32 3
130
+ ; CHECK-NEXT: ret <4 x i32> [[TMP17 ]]
135
131
;
136
132
%1 = load <4 x i32 >, <4 x i32 > addrspace (3 )* getelementptr inbounds ([3 x [3 x <4 x i32 >]], [3 x [3 x <4 x i32 >]] addrspace (3 )* @"groushared2dArrayofVectors" , i32 0 , i32 0 , i32 0 ), align 4
137
133
%2 = load <4 x i32 >, <4 x i32 > addrspace (3 )* getelementptr inbounds ([3 x [3 x <4 x i32 >]], [3 x [3 x <4 x i32 >]] addrspace (3 )* @"groushared2dArrayofVectors" , i32 0 , i32 1 , i32 1 ), align 4
0 commit comments