diff --git a/src/ATen/native/xpu/sycl/LinearInt4.cpp b/src/ATen/native/xpu/sycl/LinearInt4.cpp index 846fd3530..9378187c9 100644 --- a/src/ATen/native/xpu/sycl/LinearInt4.cpp +++ b/src/ATen/native/xpu/sycl/LinearInt4.cpp @@ -39,7 +39,8 @@ struct LinearInt4KernelFunctor : public __SYCL_KER_CONFIG_CONVENTION__ { ldc(ldc) {} void sycl_ker_config_convention(sycl::handler& cgh) {} - void operator()(sycl::nd_item<1> it) const { + [[intel::reqd_sub_group_size(16)]] void operator()( + sycl::nd_item<1> it) const { int constexpr Unroll = 2; int constexpr SgSize = 16; int constexpr blocksize = block_size;