diff --git a/include/oneapi/dpl/pstl/hetero/dpcpp/parallel_backend_sycl_reduce.h b/include/oneapi/dpl/pstl/hetero/dpcpp/parallel_backend_sycl_reduce.h index aabf829fdcf..3465e1aca97 100644 --- a/include/oneapi/dpl/pstl/hetero/dpcpp/parallel_backend_sycl_reduce.h +++ b/include/oneapi/dpl/pstl/hetero/dpcpp/parallel_backend_sycl_reduce.h @@ -50,7 +50,7 @@ class __reduce_kernel; // Adjust number of sequential operations per work-item based on the vector size. Single elements are kept to // improve performance of small arrays or remainder loops. template <::std::uint8_t _VecSize, typename _Size> -inline _Size +_Size __adjust_iters_per_work_item(_Size __iters_per_work_item) { if (__iters_per_work_item > 1)