We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 300a70f, commit 3d0f259 (Copy full SHA for 3d0f259)
1 file changed
csrc/xpu_kernels.h
@@ -22,6 +22,7 @@ template <typename T, int TILE_SIZE, int NUM_PER_TH, int DATA_TYPE> class kDequa
22
23   template <typename T, size_t GROUP_SIZE, size_t NUM_PER_THREAD, size_t SUBG_SIZE, int BITS> class kgemv_4bit_inference {
24   public:
25 + [[sycl::reqd_sub_group_size(SUBG_SIZE)]]
26   SYCL_EXTERNAL void operator()(sycl::nd_item<1> item) const;
27
28   kgemv_4bit_inference(
0 commit comments