@@ -2056,11 +2056,11 @@ class joint_matrix {
20562056 const size_t num_elements;
20572057};
20582058
2059- // / Stores 1 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2059+ // / Stores 1 8x8 b16 matrix from private memory to local memory (32-bits per wi)
20602060// / Requires the sub-group size of kernel calling this function to be 32
20612061// / \tparam [in] T The type of matrix elements
2062- // / \param [in] addr The address of the matrix in shared memory
2063- // / \param [in] m The local memory containing data of matrix
2062+ // / \param [in] addr The address of the matrix in local memory
2063+ // / \param [in] m The private memory containing data of matrix
20642064// / \param [in] item The sycl::nd_item index space class
20652065// / \param [in] trans Indicates whether the matrix is to be stored transposed
20662066// / \param [in] mat The matrix index to be stored
@@ -2111,12 +2111,12 @@ void stmatrix(uintptr_t addr, T m, const ItemT &item, bool trans = false,
21112111 }
21122112}
21132113
2114- // / Stores 2 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2114+ // / Stores 2 8x8 b16 matrices from private memory to local memory (32-bits per wi)
21152115// / Requires the sub-group size of kernel calling this function to be 32
21162116// / \tparam [in] T The type of matrix elements
2117- // / \param [in] addr The address of the matrix in shared memory
2118- // / \param [in] m1 The local memory containing data of 1st matrix
2119- // / \param [in] m2 The local memory containing data of 2nd matrix
2117+ // / \param [in] addr The address of the matrix in local memory
2118+ // / \param [in] m1 The private memory containing data of 1st matrix
2119+ // / \param [in] m2 The private memory containing data of 2nd matrix
21202120// / \param [in] item The sycl::nd_item index space class
21212121// / \param [in] trans Indicates whether the matrix is to be stored transposed
21222122template <typename T, typename ItemT>
@@ -2128,14 +2128,14 @@ void stmatrix(uintptr_t addr, T m1, T m2, const ItemT &item,
21282128 stmatrix (addr, m2, item, trans, 1 );
21292129}
21302130
2131- // / Stores 4 8x8 b16 matrix from local memory to shared memory (32-bits per wi)
2131+ // / Stores 4 8x8 b16 matrices from private memory to local memory (32-bits per wi)
21322132// / Requires the sub-group size of kernel calling this function to be 32
21332133// / \tparam [in] T The type of matrix elements
2134- // / \param [in] addr The address of the matrix in shared memory
2135- // / \param [in] m1 The local memory containing data of 1st matrix
2136- // / \param [in] m2 The local memory containing data of 2nd matrix
2137- // / \param [in] m3 The local memory containing data of 3rd matrix
2138- // / \param [in] m4 The local memory containing data of 4th matrix
2134+ // / \param [in] addr The address of the matrix in local memory
2135+ // / \param [in] m1 The private memory containing data of 1st matrix
2136+ // / \param [in] m2 The private memory containing data of 2nd matrix
2137+ // / \param [in] m3 The private memory containing data of 3rd matrix
2138+ // / \param [in] m4 The private memory containing data of 4th matrix
21392139// / \param [in] item The sycl::nd_item index space class
21402140// / \param [in] trans Indicates whether the matrices are to be stored transposed
21412141template <typename T, typename ItemT>
0 commit comments