3
3
4
4
; Make sure we can load groupshared vectors, static vectors, and arrays of vectors
5
5
6
- @"arrayofVecData" = local_unnamed_addr addrspace (3 ) global [2 x <3 x float >] zeroinitializer , align 16
6
+ @"arrayofVecData" = local_unnamed_addr addrspace (3 ) global [2 x <4 x i32 >] zeroinitializer , align 16
7
7
@"vecData" = external addrspace (3 ) global <4 x i32 >, align 4
8
8
@staticArrayOfVecData = internal global [3 x <4 x i32 >] [<4 x i32 > <i32 1 , i32 2 , i32 3 , i32 4 >, <4 x i32 > <i32 5 , i32 6 , i32 7 , i32 8 >, <4 x i32 > <i32 9 , i32 10 , i32 11 , i32 12 >], align 4
9
- @"groushared2dArrayofVectors " = local_unnamed_addr addrspace (3 ) global [3 x [ 3 x <4 x i32 >]] zeroinitializer , align 16
9
+ @"groupshared2dArrayofVectors " = local_unnamed_addr addrspace (3 ) global [3 x [3 x <4 x i32 >]] zeroinitializer , align 16
10
10
11
- ; CHECK: @arrayofVecData.scalarized.1dim = local_unnamed_addr addrspace(3) global [6 x float ] zeroinitializer, align 16
11
+ ; CHECK: @arrayofVecData.scalarized.1dim = local_unnamed_addr addrspace(3) global [8 x i32] zeroinitializer, align 16
12
12
; CHECK: @vecData.scalarized = external addrspace(3) global [4 x i32], align 4
13
13
; CHECK: @staticArrayOfVecData.scalarized.1dim = internal global [12 x i32] [i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12], align 4
14
- ; CHECK: @groushared2dArrayofVectors .scalarized.1dim = local_unnamed_addr addrspace(3) global [36 x i32] zeroinitializer, align 16
14
+ ; CHECK: @groupshared2dArrayofVectors .scalarized.1dim = local_unnamed_addr addrspace(3) global [36 x i32] zeroinitializer, align 16
15
15
16
16
; CHECK-NOT: @arrayofVecData
17
17
; CHECK-NOT: @arrayofVecData.scalarized
18
18
; CHECK-NOT: @vecData
19
19
; CHECK-NOT: @staticArrayOfVecData
20
20
; CHECK-NOT: @staticArrayOfVecData.scalarized
21
- ; CHECK-NOT: @groushared2dArrayofVectors
22
- ; CHECK-NOT: @groushared2dArrayofVectors .scalarized
21
+ ; CHECK-NOT: @groupshared2dArrayofVectors
22
+ ; CHECK-NOT: @groupshared2dArrayofVectors .scalarized
23
23
24
24
define <4 x i32 > @load_array_vec_test () #0 {
25
25
; CHECK-LABEL: define <4 x i32> @load_array_vec_test(
26
26
; CHECK-SAME: ) #[[ATTR0:[0-9]+]] {
27
- ; CHECK-NEXT: [[TMP1:%.*]] = bitcast ptr addrspace(3) @arrayofVecData.scalarized.1dim to ptr addrspace(3)
28
- ; CHECK-NEXT: [[TMP2:%.*]] = load i32, ptr addrspace(3) [[TMP1]], align 4
29
- ; CHECK-NEXT: [[TMP3:%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 1) to ptr addrspace(3)
30
- ; CHECK-NEXT: [[TMP4:%.*]] = load i32, ptr addrspace(3) [[TMP3]], align 4
31
- ; CHECK-NEXT: [[TMP5:%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 2) to ptr addrspace(3)
32
- ; CHECK-NEXT: [[TMP6:%.*]] = load i32, ptr addrspace(3) [[TMP5]], align 4
33
- ; CHECK-NEXT: [[TMP7:%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 3) to ptr addrspace(3)
34
- ; CHECK-NEXT: [[TMP8:%.*]] = load i32, ptr addrspace(3) [[TMP7]], align 4
35
- ; CHECK-NEXT: [[TMP9:%.*]] = bitcast ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0, i32 1) to ptr addrspace(3)
36
- ; CHECK-NEXT: [[TMP10:%.*]] = load i32, ptr addrspace(3) [[TMP9]], align 4
37
- ; CHECK-NEXT: [[TMP11:%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0, i32 1), i32 1) to ptr addrspace(3)
38
- ; CHECK-NEXT: [[TMP12:%.*]] = load i32, ptr addrspace(3) [[TMP11]], align 4
39
- ; CHECK-NEXT: [[TMP13:%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0, i32 1), i32 2) to ptr addrspace(3)
40
- ; CHECK-NEXT: [[TMP14:%.*]] = load i32, ptr addrspace(3) [[TMP13]], align 4
41
- ; CHECK-NEXT: [[TMP15:%.*]] = bitcast ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([6 x float], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0, i32 1), i32 3) to ptr addrspace(3)
42
- ; CHECK-NEXT: [[TMP16:%.*]] = load i32, ptr addrspace(3) [[TMP15]], align 4
27
+ ; CHECK-NEXT: [[TMP2:%.*]] = load i32, ptr addrspace(3) @arrayofVecData.scalarized.1dim, align 4
28
+ ; CHECK-NEXT: [[TMP4:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 1), align 4
29
+ ; CHECK-NEXT: [[TMP6:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 2), align 4
30
+ ; CHECK-NEXT: [[TMP8:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 3), align 4
31
+ ; CHECK-NEXT: [[TMP10:%.*]] = load i32, ptr addrspace(3) getelementptr inbounds ([8 x i32], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0, i32 4), align 4
32
+ ; CHECK-NEXT: [[TMP12:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([8 x i32], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0, i32 4), i32 1), align 4
33
+ ; CHECK-NEXT: [[TMP14:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([8 x i32], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0, i32 4), i32 2), align 4
34
+ ; CHECK-NEXT: [[TMP16:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([8 x i32], ptr addrspace(3) @arrayofVecData.scalarized.1dim, i32 0, i32 4), i32 3), align 4
43
35
; CHECK-NEXT: [[DOTI05:%.*]] = add i32 [[TMP2]], [[TMP10]]
44
36
; CHECK-NEXT: [[DOTI16:%.*]] = add i32 [[TMP4]], [[TMP12]]
45
37
; CHECK-NEXT: [[DOTI27:%.*]] = add i32 [[TMP6]], [[TMP14]]
@@ -77,7 +69,9 @@ define <4 x i32> @load_vec_test() #0 {
77
69
define <4 x i32 > @load_static_array_of_vec_test (i32 %index ) #0 {
78
70
; CHECK-LABEL: define <4 x i32> @load_static_array_of_vec_test(
79
71
; CHECK-SAME: i32 [[INDEX:%.*]]) #[[ATTR0]] {
80
- ; CHECK-NEXT: [[DOTFLAT:%.*]] = getelementptr inbounds [12 x i32], ptr @staticArrayOfVecData.scalarized.1dim, i32 0, i32 [[INDEX]]
72
+ ; CHECK-NEXT: [[TMP3:%.*]] = mul i32 [[INDEX]], 4
73
+ ; CHECK-NEXT: [[TMP2:%.*]] = add i32 0, [[TMP3]]
74
+ ; CHECK-NEXT: [[DOTFLAT:%.*]] = getelementptr inbounds [12 x i32], ptr @staticArrayOfVecData.scalarized.1dim, i32 0, i32 [[TMP2]]
81
75
; CHECK-NEXT: [[DOTI0:%.*]] = load i32, ptr [[DOTFLAT]], align 4
82
76
; CHECK-NEXT: [[DOTFLAT_I1:%.*]] = getelementptr i32, ptr [[DOTFLAT]], i32 1
83
77
; CHECK-NEXT: [[DOTI1:%.*]] = load i32, ptr [[DOTFLAT_I1]], align 4
@@ -99,14 +93,14 @@ define <4 x i32> @load_static_array_of_vec_test(i32 %index) #0 {
99
93
define <4 x i32 > @multid_load_test () #0 {
100
94
; CHECK-LABEL: define <4 x i32> @multid_load_test(
101
95
; CHECK-SAME: ) #[[ATTR0]] {
102
- ; CHECK-NEXT: [[TMP1:%.*]] = load i32, ptr addrspace(3) @groushared2dArrayofVectors .scalarized.1dim, align 4
103
- ; CHECK-NEXT: [[TMP2:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @groushared2dArrayofVectors .scalarized.1dim, i32 1), align 4
104
- ; CHECK-NEXT: [[TMP3:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @groushared2dArrayofVectors .scalarized.1dim, i32 2), align 4
105
- ; CHECK-NEXT: [[TMP4:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @groushared2dArrayofVectors .scalarized.1dim, i32 3), align 4
106
- ; CHECK-NEXT: [[TMP5:%.*]] = load i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors .scalarized.1dim, i32 0, i32 4 ), align 4
107
- ; CHECK-NEXT: [[DOTI13:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors .scalarized.1dim, i32 0, i32 4 ), i32 1), align 4
108
- ; CHECK-NEXT: [[DOTI25:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors .scalarized.1dim, i32 0, i32 4 ), i32 2), align 4
109
- ; CHECK-NEXT: [[DOTI37:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groushared2dArrayofVectors .scalarized.1dim, i32 0, i32 4 ), i32 3), align 4
96
+ ; CHECK-NEXT: [[TMP1:%.*]] = load i32, ptr addrspace(3) @groupshared2dArrayofVectors .scalarized.1dim, align 4
97
+ ; CHECK-NEXT: [[TMP2:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @groupshared2dArrayofVectors .scalarized.1dim, i32 1), align 4
98
+ ; CHECK-NEXT: [[TMP3:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @groupshared2dArrayofVectors .scalarized.1dim, i32 2), align 4
99
+ ; CHECK-NEXT: [[TMP4:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) @groupshared2dArrayofVectors .scalarized.1dim, i32 3), align 4
100
+ ; CHECK-NEXT: [[TMP5:%.*]] = load i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groupshared2dArrayofVectors .scalarized.1dim, i32 0, i32 16 ), align 4
101
+ ; CHECK-NEXT: [[DOTI13:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groupshared2dArrayofVectors .scalarized.1dim, i32 0, i32 16 ), i32 1), align 4
102
+ ; CHECK-NEXT: [[DOTI25:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groupshared2dArrayofVectors .scalarized.1dim, i32 0, i32 16 ), i32 2), align 4
103
+ ; CHECK-NEXT: [[DOTI37:%.*]] = load i32, ptr addrspace(3) getelementptr (i32, ptr addrspace(3) getelementptr inbounds ([36 x i32], ptr addrspace(3) @groupshared2dArrayofVectors .scalarized.1dim, i32 0, i32 16 ), i32 3), align 4
110
104
; CHECK-NEXT: [[DOTI08:%.*]] = add i32 [[TMP1]], [[TMP5]]
111
105
; CHECK-NEXT: [[DOTI19:%.*]] = add i32 [[TMP2]], [[DOTI13]]
112
106
; CHECK-NEXT: [[DOTI210:%.*]] = add i32 [[TMP3]], [[DOTI25]]
@@ -117,8 +111,8 @@ define <4 x i32> @multid_load_test() #0 {
117
111
; CHECK-NEXT: [[TMP6:%.*]] = insertelement <4 x i32> [[DOTUPTO217]], i32 [[DOTI311]], i32 3
118
112
; CHECK-NEXT: ret <4 x i32> [[TMP6]]
119
113
;
120
- %1 = load <4 x i32 >, <4 x i32 > addrspace (3 )* getelementptr inbounds ([3 x [3 x <4 x i32 >]], [3 x [3 x <4 x i32 >]] addrspace (3 )* @"groushared2dArrayofVectors " , i32 0 , i32 0 , i32 0 ), align 4
121
- %2 = load <4 x i32 >, <4 x i32 > addrspace (3 )* getelementptr inbounds ([3 x [3 x <4 x i32 >]], [3 x [3 x <4 x i32 >]] addrspace (3 )* @"groushared2dArrayofVectors " , i32 0 , i32 1 , i32 1 ), align 4
114
+ %1 = load <4 x i32 >, <4 x i32 > addrspace (3 )* getelementptr inbounds ([3 x [3 x <4 x i32 >]], [3 x [3 x <4 x i32 >]] addrspace (3 )* @"groupshared2dArrayofVectors " , i32 0 , i32 0 , i32 0 ), align 4
115
+ %2 = load <4 x i32 >, <4 x i32 > addrspace (3 )* getelementptr inbounds ([3 x [3 x <4 x i32 >]], [3 x [3 x <4 x i32 >]] addrspace (3 )* @"groupshared2dArrayofVectors " , i32 0 , i32 1 , i32 1 ), align 4
122
116
%3 = add <4 x i32 > %1 , %2
123
117
ret <4 x i32 > %3
124
118
}
0 commit comments