@@ -2218,11 +2218,11 @@ void ldmatrix(uintptr_t addr, T *m1, T *m2, T *m3, T *m4, bool trans = false) {
2218
2218
ldmatrix (addr, m4, trans, 3 );
2219
2219
}
2220
2220
2221
- // / Stores 1 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2221
+ // / Stores 1 8x8 b16 matrix from private memory to local memory (32-bits per wi)
2222
2222
// / Requires the sub-group size of kernel calling this function to be 32
2223
2223
// / \tparam [in] T The type of matrix elements
2224
- // / \param [in] addr The address of the matrix in shared memory
2225
- // / \param [in] m The local memory containing data of matrix
2224
+ // / \param [in] addr The address of the matrix in local memory
2225
+ // / \param [in] m The private memory containing data of matrix
2226
2226
// / \param [in] item The sycl::nd_item index space class
2227
2227
// / \param [in] trans Indicates whether the matrix is to be stored transposed
2228
2228
// / \param [in] mat The matrix index to be stored
@@ -2273,12 +2273,12 @@ void stmatrix(uintptr_t addr, T m, const ItemT &item, bool trans = false,
2273
2273
}
2274
2274
}
2275
2275
2276
- // / Stores 2 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2276
+ // / Stores 2 8x8 b16 matrices from private memory to local memory (32-bits per wi)
2277
2277
// / Requires the sub-group size of kernel calling this function to be 32
2278
2278
// / \tparam [in] T The type of matrix elements
2279
- // / \param [in] addr The address of the matrix in shared memory
2280
- // / \param [in] m1 The local memory containing data of 1st matrix
2281
- // / \param [in] m2 The local memory containing data of 2nd matrix
2279
+ // / \param [in] addr The address of the matrix in local memory
2280
+ // / \param [in] m1 The private memory containing data of 1st matrix
2281
+ // / \param [in] m2 The private memory containing data of 2nd matrix
2282
2282
// / \param [in] item The sycl::nd_item index space class
2283
2283
// / \param [in] trans Indicates whether the matrix is to be stored transposed
2284
2284
template <typename T, typename ItemT>
@@ -2290,14 +2290,14 @@ void stmatrix(uintptr_t addr, T m1, T m2, const ItemT &item,
2290
2290
stmatrix (addr, m2, item, trans, 1 );
2291
2291
}
2292
2292
2293
- // / Stores 4 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2293
+ // / Stores 4 8x8 b16 matrices from private memory to local memory (32-bits per wi)
2294
2294
// / Requires the sub-group size of kernel calling this function to be 32
2295
2295
// / \tparam [in] T The type of matrix elements
2296
- // / \param [in] addr The address of the matrix in shared memory
2297
- // / \param [in] m1 The local memory containing data of 1st matrix
2298
- // / \param [in] m2 The local memory containing data of 2nd matrix
2299
- // / \param [in] m3 The local memory containing data of 3rd matrix
2300
- // / \param [in] m4 The local memory containing data of 4th matrix
2296
+ // / \param [in] addr The address of the matrix in local memory
2297
+ // / \param [in] m1 The private memory containing data of 1st matrix
2298
+ // / \param [in] m2 The private memory containing data of 2nd matrix
2299
+ // / \param [in] m3 The private memory containing data of 3rd matrix
2300
+ // / \param [in] m4 The private memory containing data of 4th matrix
2301
2301
// / \param [in] item The sycl::nd_item index space class
2302
2302
// / \param [in] trans Indicates whether the matrix is to be stored transposed
2303
2303
template <typename T, typename ItemT>
0 commit comments