@@ -2056,11 +2056,11 @@ class joint_matrix {
2056
2056
const size_t num_elements;
2057
2057
};
2058
2058
2059
- // / Stores 1 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2059
+ // / Stores 1 8x8 b16 matrix from private memory to local memory (32 bits per work-item)
2060
2060
// / Requires the sub-group size of kernel calling this function to be 32
2061
2061
// / \tparam [in] T The type of matrix elements
2062
- // / \param [in] addr The address of the matrix in shared memory
2063
- // / \param [in] m The local memory containing data of matrix
2062
+ // / \param [in] addr The address of the matrix in local memory
2063
+ // / \param [in] m The private memory containing data of matrix
2064
2064
// / \param [in] item The sycl::nd_item index space class
2065
2065
// / \param [in] trans Indicates whether the matrix is to be stored transposed
2066
2066
// / \param [in] mat The index of the matrix to be stored
@@ -2111,12 +2111,12 @@ void stmatrix(uintptr_t addr, T m, const ItemT &item, bool trans = false,
2111
2111
}
2112
2112
}
2113
2113
2114
- // / Stores 2 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2114
+ // / Stores 2 8x8 b16 matrices from private memory to local memory (32 bits per work-item)
2115
2115
// / Requires the sub-group size of kernel calling this function to be 32
2116
2116
// / \tparam [in] T The type of matrix elements
2117
- // / \param [in] addr The address of the matrix in shared memory
2118
- // / \param [in] m1 The local memory containing data of 1st matrix
2119
- // / \param [in] m2 The local memory containing data of 2nd matrix
2117
+ // / \param [in] addr The address of the matrix in local memory
2118
+ // / \param [in] m1 The private memory containing data of 1st matrix
2119
+ // / \param [in] m2 The private memory containing data of 2nd matrix
2120
2120
// / \param [in] item The sycl::nd_item index space class
2121
2121
// / \param [in] trans Indicates whether the matrices are to be stored transposed
2122
2122
template <typename T, typename ItemT>
@@ -2128,14 +2128,14 @@ void stmatrix(uintptr_t addr, T m1, T m2, const ItemT &item,
2128
2128
stmatrix (addr, m2, item, trans, 1 );
2129
2129
}
2130
2130
2131
- // / Stores 4 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2131
+ // / Stores 4 8x8 b16 matrices from private memory to local memory (32 bits per work-item)
2132
2132
// / Requires the sub-group size of kernel calling this function to be 32
2133
2133
// / \tparam [in] T The type of matrix elements
2134
- // / \param [in] addr The address of the matrix in shared memory
2135
- // / \param [in] m1 The local memory containing data of 1st matrix
2136
- // / \param [in] m2 The local memory containing data of 2nd matrix
2137
- // / \param [in] m3 The local memory containing data of 3rd matrix
2138
- // / \param [in] m4 The local memory containing data of 4th matrix
2134
+ // / \param [in] addr The address of the matrix in local memory
2135
+ // / \param [in] m1 The private memory containing data of 1st matrix
2136
+ // / \param [in] m2 The private memory containing data of 2nd matrix
2137
+ // / \param [in] m3 The private memory containing data of 3rd matrix
2138
+ // / \param [in] m4 The private memory containing data of 4th matrix
2139
2139
// / \param [in] item The sycl::nd_item index space class
2140
2140
// / \param [in] trans Indicates whether the matrices are to be stored transposed
2141
2141
template <typename T, typename ItemT>
0 commit comments