3
3
//CHECK: #map = affine_map<()[s0] -> (s0 floordiv 4)>
4
4
//CHECK: #map1 = affine_map<()[s0] -> (s0 mod 4)>
5
5
gpu.module @test_1_1_assignment {
6
- // CHECK-LABEL: test_create_nd_tdesc
6
+ // CHECK-LABEL: create_nd_tdesc
7
7
// CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
8
- gpu.func @test_create_nd_tdesc (%src: memref <24 x32 xf32 >) {
8
+ gpu.func @create_nd_tdesc (%src: memref <24 x32 xf32 >) {
9
9
// CHECK: %[[SGID:.*]] = gpu.subgroup_id
10
10
// CHECK: %[[C12:.*]] = arith.constant 12 : index
11
11
// CHECK: %[[C4:.*]] = arith.constant 4 : index
@@ -30,9 +30,9 @@ gpu.module @test_1_1_assignment {
30
30
gpu.return
31
31
}
32
32
33
- // CHECK-LABEL: test_load_nd_tdesc
33
+ // CHECK-LABEL: load_nd_tdesc
34
34
// CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
35
- gpu.func @test_load_nd_tdesc (%src: memref <24 x32 xf32 >) {
35
+ gpu.func @load_nd_tdesc (%src: memref <24 x32 xf32 >) {
36
36
// CHECK: %[[TDESC:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
37
37
// CHECK-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
38
38
// CHECK: %[[LOAD:.*]] = xegpu.load_nd %[[TDESC]]
@@ -46,9 +46,9 @@ gpu.module @test_1_1_assignment {
46
46
gpu.return
47
47
}
48
48
49
- // CHECK-LABEL: test_store_nd
49
+ // CHECK-LABEL: store_nd
50
50
// CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
51
- gpu.func @test_store_nd (%src: memref <24 x32 xf32 >) {
51
+ gpu.func @store_nd (%src: memref <24 x32 xf32 >) {
52
52
// CHECK: %[[TDESC:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
53
53
// CHECK-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
54
54
// CHECK: %[[LOAD:.*]] = xegpu.load_nd %[[TDESC]]
@@ -66,9 +66,9 @@ gpu.module @test_1_1_assignment {
66
66
gpu.return
67
67
}
68
68
69
- // CHECK-LABEL: test_update_nd
69
+ // CHECK-LABEL: update_nd
70
70
// CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
71
- gpu.func @test_update_nd (%src: memref <24 x32 xf32 >){
71
+ gpu.func @update_nd (%src: memref <24 x32 xf32 >){
72
72
// CHECK: %[[TDESC:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
73
73
// CHECK-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
74
74
// CHECK: %[[UPDATE:.*]] = xegpu.update_nd_offset %[[TDESC]], [0, 16]
@@ -80,10 +80,10 @@ gpu.func @test_update_nd(%src: memref<24x32xf32>){
80
80
gpu.return
81
81
}
82
82
83
- // CHECK-LABEL: test_dpas
83
+ // CHECK-LABEL: dpas
84
84
// CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
85
85
// CHECK-SAME: %[[ARG_1:.*]]: memref<32x24xf32>
86
- gpu.func @test_dpas (%a: memref <24 x32 xf32 >, %b: memref <32 x24 xf32 >) {
86
+ gpu.func @dpas (%a: memref <24 x32 xf32 >, %b: memref <32 x24 xf32 >) {
87
87
// CHECK: %[[TDESC_A:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
88
88
// CHECk-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
89
89
// CHECK: %[[LOAD_A:.*]] = xegpu.load_nd %[[TDESC_A]]
@@ -114,10 +114,10 @@ gpu.func @test_dpas(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
114
114
}
115
115
116
116
117
- // CHECK-LABEL: test_dpas_no_sg_data
117
+ // CHECK-LABEL: dpas_no_sg_data
118
118
// CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
119
119
// CHECK-SAME: %[[ARG_1:.*]]: memref<32x24xf32>
120
- gpu.func @test_dpas_no_sg_data (%a: memref <24 x32 xf32 >, %b: memref <32 x24 xf32 >) {
120
+ gpu.func @dpas_no_sg_data (%a: memref <24 x32 xf32 >, %b: memref <32 x24 xf32 >) {
121
121
// CHECK: %[[TDESC_A:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
122
122
// CHECk-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
123
123
// CHECK: %[[LOAD_A:.*]] = xegpu.load_nd %[[TDESC_A]]
@@ -147,9 +147,9 @@ gpu.func @test_dpas_no_sg_data(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
147
147
gpu.return
148
148
}
149
149
150
- // CHECK-LABEL: test_prefetch_nd_tdesc
150
+ // CHECK-LABEL: prefetch_nd_tdesc
151
151
// CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
152
- gpu.func @test_prefetch_nd_tdesc (%src: memref <24 x32 xf32 >) {
152
+ gpu.func @prefetch_nd_tdesc (%src: memref <24 x32 xf32 >) {
153
153
// CHECK: %[[TDESC:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
154
154
// CHECK-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
155
155
// CHECK: xegpu.prefetch_nd %[[TDESC]]
@@ -161,16 +161,16 @@ gpu.func @test_dpas_no_sg_data(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
161
161
gpu.return
162
162
}
163
163
164
- // CHECK-LABEL: test_dpas_with_no_create_nd_desc
165
- gpu.func @test_dpas_with_no_create_nd_desc (%a: vector <24 x32 xf32 >, %b: vector <32 x24 xf32 >) {
164
+ // CHECK-LABEL: dpas_with_no_create_nd_desc
165
+ gpu.func @dpas_with_no_create_nd_desc (%a: vector <24 x32 xf32 >, %b: vector <32 x24 xf32 >) {
166
166
// CHECK-NOT: vector<12x12xf32>
167
167
%dpas = xegpu.dpas %a , %b
168
168
{layout = #xegpu.layout <sg_layout = [2 , 2 ], sg_data = [12 , 12 ], lane_layout = [2 , 2 ], lane_data = [1 , 1 ]>}
169
169
: vector <24 x32 xf32 >, vector <32 x24 xf32 > -> vector <24 x24 xf32 >
170
170
gpu.return
171
171
}
172
172
173
- gpu.func @test_scf_for (%arg0: memref <1024 x1024 xf16 >, %arg1: memref <1024 x1024 xf16 >, %arg2: memref <1024 x1024 xf32 >) {
173
+ gpu.func @scf_for (%arg0: memref <1024 x1024 xf16 >, %arg1: memref <1024 x1024 xf16 >, %arg2: memref <1024 x1024 xf32 >) {
174
174
//CHECK: [[c0:%.+]] = arith.constant 0 : index
175
175
//CHECK: [[c128:%.+]] = arith.constant 128 : index
176
176
//CHECK: [[c1024:%.+]] = arith.constant 1024 : index
@@ -213,7 +213,7 @@ gpu.func @test_dpas_no_sg_data(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
213
213
gpu.return
214
214
}
215
215
216
- gpu.func @test_scf_while_and_condition (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
216
+ gpu.func @scf_while_and_condition (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
217
217
%c1_i32 = arith.constant 1 : i32
218
218
%c10_i32 = arith.constant 10 : i32
219
219
%c0_i32 = arith.constant 0 : i32
@@ -238,7 +238,7 @@ gpu.func @test_dpas_no_sg_data(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
238
238
gpu.return
239
239
}
240
240
241
- gpu.func @test_scf_if (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
241
+ gpu.func @scf_if (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
242
242
%c10 = arith.constant 10 : index
243
243
%id = gpu.subgroup_id : index
244
244
@@ -267,7 +267,7 @@ gpu.func @test_dpas_no_sg_data(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
267
267
gpu.return
268
268
}
269
269
270
- gpu.func @test_scf_if_tensor_desc (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
270
+ gpu.func @scf_if_tensor_desc (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
271
271
%c10 = arith.constant 10 : index
272
272
%id = gpu.subgroup_id : index
273
273
0 commit comments