@@ -2218,11 +2218,11 @@ void ldmatrix(uintptr_t addr, T *m1, T *m2, T *m3, T *m4, bool trans = false) {
22182218 ldmatrix (addr, m4, trans, 3 );
22192219}
22202220
2221- // / Stores 1 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2221+ // / Stores 1 8x8 b16 matrix from private memory to local memory (32-bits per wi)
22222222// / Requires the sub-group size of kernel calling this function to be 32
22232223// / \tparam [in] T The type of matrix elements
2224- // / \param [in] addr The address of the matrix in shared memory
2225- // / \param [in] m The local memory containing data of matrix
2224+ // / \param [in] addr The address of the matrix in local memory
2225+ // / \param [in] m The private memory containing data of matrix
22262226// / \param [in] item The sycl::nd_item index space class
22272227// / \param [in] trans Indicates whether the matrix is to be stored transposed
22282228// / \param [in] mat The matrix index to be stored
@@ -2273,12 +2273,12 @@ void stmatrix(uintptr_t addr, T m, const ItemT &item, bool trans = false,
22732273 }
22742274}
22752275
2276- // / Stores 2 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2276+ // / Stores 2 8x8 b16 matrices from private memory to local memory (32-bits per wi)
22772277// / Requires the sub-group size of kernel calling this function to be 32
22782278// / \tparam [in] T The type of matrix elements
2279- // / \param [in] addr The address of the matrix in shared memory
2280- // / \param [in] m1 The local memory containing data of 1st matrix
2281- // / \param [in] m2 The local memory containing data of 2nd matrix
2279+ // / \param [in] addr The address of the matrix in local memory
2280+ // / \param [in] m1 The private memory containing data of 1st matrix
2281+ // / \param [in] m2 The private memory containing data of 2nd matrix
22822282// / \param [in] item The sycl::nd_item index space class
22832283// / \param [in] trans Indicates whether the matrices are to be stored transposed
22842284template <typename T, typename ItemT>
@@ -2290,14 +2290,14 @@ void stmatrix(uintptr_t addr, T m1, T m2, const ItemT &item,
22902290 stmatrix (addr, m2, item, trans, 1 );
22912291}
22922292
2293- // / Stores 4 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2293+ // / Stores 4 8x8 b16 matrices from private memory to local memory (32-bits per wi)
22942294// / Requires the sub-group size of kernel calling this function to be 32
22952295// / \tparam [in] T The type of matrix elements
2296- // / \param [in] addr The address of the matrix in shared memory
2297- // / \param [in] m1 The local memory containing data of 1st matrix
2298- // / \param [in] m2 The local memory containing data of 2nd matrix
2299- // / \param [in] m3 The local memory containing data of 3rd matrix
2300- // / \param [in] m4 The local memory containing data of 4th matrix
2296+ // / \param [in] addr The address of the matrix in local memory
2297+ // / \param [in] m1 The private memory containing data of 1st matrix
2298+ // / \param [in] m2 The private memory containing data of 2nd matrix
2299+ // / \param [in] m3 The private memory containing data of 3rd matrix
2300+ // / \param [in] m4 The private memory containing data of 4th matrix
23012301// / \param [in] item The sycl::nd_item index space class
23022302// / \param [in] trans Indicates whether the matrices are to be stored transposed
23032303template <typename T, typename ItemT>
0 commit comments