diff --git a/include/oneapi/math/blas/detail/generic/blas_ct.hxx b/include/oneapi/math/blas/detail/generic/blas_ct.hxx index 831a654a8..d96f43e62 100644 --- a/include/oneapi/math/blas/detail/generic/blas_ct.hxx +++ b/include/oneapi/math/blas/detail/generic/blas_ct.hxx @@ -23,7 +23,7 @@ void herk(backend_selector selector, uplo upper_lower, transpo std::int64_t n, std::int64_t k, float alpha, sycl::buffer, 1>& a, std::int64_t lda, float beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::herk(selector.get_queue(), upper_lower, trans, n, k, alpha, - a, lda, beta, c, ldc); + a, lda, beta, c, ldc); } void herk(backend_selector selector, uplo upper_lower, transpose trans, @@ -31,7 +31,7 @@ void herk(backend_selector selector, uplo upper_lower, transpo std::int64_t lda, double beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::herk(selector.get_queue(), upper_lower, trans, n, k, alpha, - a, lda, beta, c, ldc); + a, lda, beta, c, ldc); } void scal(backend_selector selector, std::int64_t n, float alpha, @@ -67,69 +67,69 @@ void scal(backend_selector selector, std::int64_t n, double al void trmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::trmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::trmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, lda, x, incx); } void trmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::trmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::trmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, lda, x, incx); } void trmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::trmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::trmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, lda, x, incx); } void trmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::trmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::trmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, lda, x, incx); } void tpmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer& a, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, x, incx); + oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, x, incx); } void tpmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer& a, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, x, incx); + oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, x, incx); } void tpmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer, 1>& a, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, x, incx); + oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, x, incx); } void tpmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer, 1>& a, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, x, incx); + oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, x, incx); } -void spr(backend_selector selector, uplo upper_lower, std::int64_t n, - float alpha, sycl::buffer& x, std::int64_t incx, sycl::buffer& a) { +void spr(backend_selector selector, uplo upper_lower, std::int64_t n, float alpha, + sycl::buffer& x, std::int64_t incx, sycl::buffer& a) { oneapi::math::blas::generic::MAJOR::spr(selector.get_queue(), upper_lower, n, alpha, x, incx, - a); + a); } void spr(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, sycl::buffer& x, std::int64_t incx, sycl::buffer& a) { oneapi::math::blas::generic::MAJOR::spr(selector.get_queue(), upper_lower, n, alpha, x, incx, - a); + a); } void gemm_batch(backend_selector selector, transpose transa, transpose transb, @@ -139,8 +139,8 @@ void gemm_batch(backend_selector selector, transpose transa, t sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::gemm_batch(selector.get_queue(), transa, transb, m, n, k, - alpha, a, lda, stride_a, b, ldb, stride_b, beta, - c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, b, ldb, stride_b, beta, + c, ldc, stride_c, batch_size); } void gemm_batch(backend_selector selector, transpose transa, transpose transb, @@ -150,8 +150,8 @@ void gemm_batch(backend_selector selector, transpose transa, t sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::gemm_batch(selector.get_queue(), transa, transb, m, n, k, - alpha, a, lda, stride_a, b, ldb, stride_b, beta, - c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, b, ldb, stride_b, beta, + c, ldc, stride_c, batch_size); } void gemm_batch(backend_selector selector, transpose transa, transpose transb, @@ -161,8 +161,8 @@ void gemm_batch(backend_selector selector, transpose transa, t std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::gemm_batch(selector.get_queue(), transa, transb, m, n, k, - alpha, a, lda, stride_a, b, ldb, stride_b, beta, - c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, b, ldb, stride_b, beta, + c, ldc, stride_c, batch_size); } void gemm_batch(backend_selector selector, transpose transa, transpose transb, @@ -172,8 +172,8 @@ void gemm_batch(backend_selector selector, transpose transa, t std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::gemm_batch(selector.get_queue(), transa, transb, m, n, k, - alpha, a, lda, stride_a, b, ldb, stride_b, beta, - c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, b, ldb, stride_b, beta, + c, ldc, stride_c, batch_size); } void gemm_batch(backend_selector selector, transpose transa, transpose transb, @@ -183,8 +183,8 @@ void gemm_batch(backend_selector selector, transpose transa, t sycl::half beta, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::gemm_batch(selector.get_queue(), transa, transb, m, n, k, - alpha, a, lda, stride_a, b, ldb, stride_b, beta, - c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, b, ldb, stride_b, beta, + c, ldc, stride_c, batch_size); } void gemm_batch(backend_selector selector, transpose transa, transpose transb, @@ -194,8 +194,8 @@ void gemm_batch(backend_selector selector, transpose transa, t sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::gemm_batch(selector.get_queue(), transa, transb, m, n, k, - alpha, a, lda, stride_a, b, ldb, stride_b, beta, - c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, b, ldb, stride_b, beta, + c, ldc, stride_c, batch_size); } void gemm_batch(backend_selector selector, transpose transa, transpose transb, @@ -205,8 +205,8 @@ void gemm_batch(backend_selector selector, transpose transa, t float beta, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::gemm_batch(selector.get_queue(), transa, transb, m, n, k, - alpha, a, lda, stride_a, b, ldb, stride_b, beta, - c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, b, ldb, stride_b, beta, + c, ldc, stride_c, batch_size); } void gemm_batch(backend_selector selector, transpose transa, transpose transb, @@ -216,22 +216,22 @@ void gemm_batch(backend_selector selector, transpose transa, t float beta, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::gemm_batch(selector.get_queue(), transa, transb, m, n, k, - alpha, a, lda, stride_a, b, ldb, stride_b, beta, - c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, b, ldb, stride_b, beta, + c, ldc, stride_c, batch_size); } void syrk(backend_selector selector, uplo upper_lower, transpose trans, std::int64_t n, std::int64_t k, float alpha, sycl::buffer& a, std::int64_t lda, float beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::syrk(selector.get_queue(), upper_lower, trans, n, k, alpha, - a, lda, beta, c, ldc); + a, lda, beta, c, ldc); } void syrk(backend_selector selector, uplo upper_lower, transpose trans, std::int64_t n, std::int64_t k, double alpha, sycl::buffer& a, std::int64_t lda, double beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::syrk(selector.get_queue(), upper_lower, trans, n, k, alpha, - a, lda, beta, c, ldc); + a, lda, beta, c, ldc); } void syrk(backend_selector selector, uplo upper_lower, transpose trans, @@ -239,7 +239,7 @@ void syrk(backend_selector selector, uplo upper_lower, transpo sycl::buffer, 1>& a, std::int64_t lda, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::syrk(selector.get_queue(), upper_lower, trans, n, k, alpha, - a, lda, beta, c, ldc); + a, lda, beta, c, ldc); } void syrk(backend_selector selector, uplo upper_lower, transpose trans, @@ -247,7 +247,7 @@ void syrk(backend_selector selector, uplo upper_lower, transpo sycl::buffer, 1>& a, std::int64_t lda, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::syrk(selector.get_queue(), upper_lower, trans, n, k, alpha, - a, lda, beta, c, ldc); + a, lda, beta, c, ldc); } void syrk_batch(backend_selector selector, uplo upper_lower, transpose trans, @@ -255,8 +255,8 @@ void syrk_batch(backend_selector selector, uplo upper_lower, t std::int64_t lda, std::int64_t stride_a, float beta, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::syrk_batch(selector.get_queue(), upper_lower, trans, n, k, - alpha, a, lda, stride_a, beta, c, ldc, stride_c, - batch_size); + alpha, a, lda, stride_a, beta, c, ldc, stride_c, + batch_size); } void syrk_batch(backend_selector selector, uplo upper_lower, transpose trans, @@ -264,8 +264,8 @@ void syrk_batch(backend_selector selector, uplo upper_lower, t std::int64_t lda, std::int64_t stride_a, double beta, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::syrk_batch(selector.get_queue(), upper_lower, trans, n, k, - alpha, a, lda, stride_a, beta, c, ldc, stride_c, - batch_size); + alpha, a, lda, stride_a, beta, c, ldc, stride_c, + batch_size); } void syrk_batch(backend_selector selector, uplo upper_lower, transpose trans, @@ -274,8 +274,8 @@ void syrk_batch(backend_selector selector, uplo upper_lower, t std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::syrk_batch(selector.get_queue(), upper_lower, trans, n, k, - alpha, a, lda, stride_a, beta, c, ldc, stride_c, - batch_size); + alpha, a, lda, stride_a, beta, c, ldc, stride_c, + batch_size); } void syrk_batch(backend_selector selector, uplo upper_lower, transpose trans, @@ -284,8 +284,8 @@ void syrk_batch(backend_selector selector, uplo upper_lower, t std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::syrk_batch(selector.get_queue(), upper_lower, trans, n, k, - alpha, a, lda, stride_a, beta, c, ldc, stride_c, - batch_size); + alpha, a, lda, stride_a, beta, c, ldc, stride_c, + batch_size); } void her2(backend_selector selector, uplo upper_lower, std::int64_t n, @@ -293,7 +293,7 @@ void her2(backend_selector selector, uplo upper_lower, std::in sycl::buffer, 1>& y, std::int64_t incy, sycl::buffer, 1>& a, std::int64_t lda) { oneapi::math::blas::generic::MAJOR::her2(selector.get_queue(), upper_lower, n, alpha, x, incx, - y, incy, a, lda); + y, incy, a, lda); } void her2(backend_selector selector, uplo upper_lower, std::int64_t n, @@ -301,23 +301,23 @@ void her2(backend_selector selector, uplo upper_lower, std::in sycl::buffer, 1>& y, std::int64_t incy, sycl::buffer, 1>& a, std::int64_t lda) { oneapi::math::blas::generic::MAJOR::her2(selector.get_queue(), upper_lower, n, alpha, x, incx, - y, incy, a, lda); + y, incy, a, lda); } void hbmv(backend_selector selector, uplo upper_lower, std::int64_t n, std::int64_t k, std::complex alpha, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { - oneapi::math::blas::generic::MAJOR::hbmv(selector.get_queue(), upper_lower, n, k, alpha, a, - lda, x, incx, beta, y, incy); + oneapi::math::blas::generic::MAJOR::hbmv(selector.get_queue(), upper_lower, n, k, alpha, a, lda, + x, incx, beta, y, incy); } void hbmv(backend_selector selector, uplo upper_lower, std::int64_t n, std::int64_t k, std::complex alpha, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { - oneapi::math::blas::generic::MAJOR::hbmv(selector.get_queue(), upper_lower, n, k, alpha, a, - lda, x, incx, beta, y, incy); + oneapi::math::blas::generic::MAJOR::hbmv(selector.get_queue(), upper_lower, n, k, alpha, a, lda, + x, incx, beta, y, incy); } void rot(backend_selector selector, std::int64_t n, @@ -370,99 +370,99 @@ void axpy_batch(backend_selector selector, std::int64_t n, flo sycl::buffer& x, std::int64_t incx, std::int64_t stridex, sycl::buffer& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, incx, - stridex, y, incy, stridey, batch_size); + oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, incx, stridex, + y, incy, stridey, batch_size); } void axpy_batch(backend_selector selector, std::int64_t n, double alpha, sycl::buffer& x, std::int64_t incx, std::int64_t stridex, sycl::buffer& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, incx, - stridex, y, incy, stridey, batch_size); + oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, incx, stridex, + y, incy, stridey, batch_size); } void axpy_batch(backend_selector selector, std::int64_t n, std::complex alpha, sycl::buffer, 1>& x, std::int64_t incx, std::int64_t stridex, sycl::buffer, 1>& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, incx, - stridex, y, incy, stridey, batch_size); + oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, incx, stridex, + y, incy, stridey, batch_size); } void axpy_batch(backend_selector selector, std::int64_t n, std::complex alpha, sycl::buffer, 1>& x, std::int64_t incx, std::int64_t stridex, sycl::buffer, 1>& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, incx, - stridex, y, incy, stridey, batch_size); + oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, incx, stridex, + y, incy, stridey, batch_size); } void axpby(backend_selector selector, std::int64_t n, float alpha, sycl::buffer& x, std::int64_t incx, float beta, sycl::buffer& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::axpby(selector.get_queue(), n, alpha, x, incx, beta, y, - incy); + incy); } void axpby(backend_selector selector, std::int64_t n, double alpha, sycl::buffer& x, std::int64_t incx, double beta, sycl::buffer& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::axpby(selector.get_queue(), n, alpha, x, incx, beta, y, - incy); + incy); } void axpby(backend_selector selector, std::int64_t n, std::complex alpha, sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::axpby(selector.get_queue(), n, alpha, x, incx, beta, y, - incy); + incy); } void axpby(backend_selector selector, std::int64_t n, std::complex alpha, sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::axpby(selector.get_queue(), n, alpha, x, incx, beta, y, - incy); + incy); } void sdsdot(backend_selector selector, std::int64_t n, float sb, sycl::buffer& x, std::int64_t incx, sycl::buffer& y, std::int64_t incy, sycl::buffer& result) { oneapi::math::blas::generic::MAJOR::sdsdot(selector.get_queue(), n, sb, x, incx, y, incy, - result); + result); } void gerc(backend_selector selector, std::int64_t m, std::int64_t n, std::complex alpha, sycl::buffer, 1>& x, std::int64_t incx, sycl::buffer, 1>& y, std::int64_t incy, sycl::buffer, 1>& a, std::int64_t lda) { - oneapi::math::blas::generic::MAJOR::gerc(selector.get_queue(), m, n, alpha, x, incx, y, incy, - a, lda); + oneapi::math::blas::generic::MAJOR::gerc(selector.get_queue(), m, n, alpha, x, incx, y, incy, a, + lda); } void gerc(backend_selector selector, std::int64_t m, std::int64_t n, std::complex alpha, sycl::buffer, 1>& x, std::int64_t incx, sycl::buffer, 1>& y, std::int64_t incy, sycl::buffer, 1>& a, std::int64_t lda) { - oneapi::math::blas::generic::MAJOR::gerc(selector.get_queue(), m, n, alpha, x, incx, y, incy, - a, lda); + oneapi::math::blas::generic::MAJOR::gerc(selector.get_queue(), m, n, alpha, x, incx, y, incy, a, + lda); } void syr2k(backend_selector selector, uplo upper_lower, transpose trans, std::int64_t n, std::int64_t k, float alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb, float beta, sycl::buffer& c, std::int64_t ldc) { - oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, n, k, - alpha, a, lda, b, ldb, beta, c, ldc); + oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, n, k, alpha, + a, lda, b, ldb, beta, c, ldc); } void syr2k(backend_selector selector, uplo upper_lower, transpose trans, std::int64_t n, std::int64_t k, double alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb, double beta, sycl::buffer& c, std::int64_t ldc) { - oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, n, k, - alpha, a, lda, b, ldb, beta, c, ldc); + oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, n, k, alpha, + a, lda, b, ldb, beta, c, ldc); } void syr2k(backend_selector selector, uplo upper_lower, transpose trans, @@ -470,8 +470,8 @@ void syr2k(backend_selector selector, uplo upper_lower, transp sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& b, std::int64_t ldb, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { - oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, n, k, - alpha, a, lda, b, ldb, beta, c, ldc); + oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, n, k, alpha, + a, lda, b, ldb, beta, c, ldc); } void syr2k(backend_selector selector, uplo upper_lower, transpose trans, @@ -479,8 +479,8 @@ void syr2k(backend_selector selector, uplo upper_lower, transp sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& b, std::int64_t ldb, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { - oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, n, k, - alpha, a, lda, b, ldb, beta, c, ldc); + oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, n, k, alpha, + a, lda, b, ldb, beta, c, ldc); } void gemv(backend_selector selector, transpose trans, std::int64_t m, @@ -488,7 +488,7 @@ void gemv(backend_selector selector, transpose trans, std::int sycl::buffer& x, std::int64_t incx, float beta, sycl::buffer& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::gemv(selector.get_queue(), trans, m, n, alpha, a, lda, x, - incx, beta, y, incy); + incx, beta, y, incy); } void gemv(backend_selector selector, transpose trans, std::int64_t m, @@ -496,7 +496,7 @@ void gemv(backend_selector selector, transpose trans, std::int sycl::buffer& x, std::int64_t incx, double beta, sycl::buffer& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::gemv(selector.get_queue(), trans, m, n, alpha, a, lda, x, - incx, beta, y, incy); + incx, beta, y, incy); } void gemv(backend_selector selector, transpose trans, std::int64_t m, @@ -504,7 +504,7 @@ void gemv(backend_selector selector, transpose trans, std::int std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::gemv(selector.get_queue(), trans, m, n, alpha, a, lda, x, - incx, beta, y, incy); + incx, beta, y, incy); } void gemv(backend_selector selector, transpose trans, std::int64_t m, @@ -512,7 +512,7 @@ void gemv(backend_selector selector, transpose trans, std::int std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::gemv(selector.get_queue(), trans, m, n, alpha, a, lda, x, - incx, beta, y, incy); + incx, beta, y, incy); } void gemv_batch(backend_selector selector, transpose trans, std::int64_t m, @@ -520,9 +520,9 @@ void gemv_batch(backend_selector selector, transpose trans, st std::int64_t stridea, sycl::buffer& x, std::int64_t incx, std::int64_t stridex, float beta, sycl::buffer& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::gemv_batch(selector.get_queue(), trans, m, n, alpha, a, - lda, stridea, x, incx, stridex, beta, y, incy, - stridey, batch_size); + oneapi::math::blas::generic::MAJOR::gemv_batch(selector.get_queue(), trans, m, n, alpha, a, lda, + stridea, x, incx, stridex, beta, y, incy, + stridey, batch_size); } void gemv_batch(backend_selector selector, transpose trans, std::int64_t m, @@ -530,9 +530,9 @@ void gemv_batch(backend_selector selector, transpose trans, st std::int64_t stridea, sycl::buffer& x, std::int64_t incx, std::int64_t stridex, double beta, sycl::buffer& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::gemv_batch(selector.get_queue(), trans, m, n, alpha, a, - lda, stridea, x, incx, stridex, beta, y, incy, - stridey, batch_size); + oneapi::math::blas::generic::MAJOR::gemv_batch(selector.get_queue(), trans, m, n, alpha, a, lda, + stridea, x, incx, stridex, beta, y, incy, + stridey, batch_size); } void gemv_batch(backend_selector selector, transpose trans, std::int64_t m, @@ -541,9 +541,9 @@ void gemv_batch(backend_selector selector, transpose trans, st std::int64_t incx, std::int64_t stridex, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::gemv_batch(selector.get_queue(), trans, m, n, alpha, a, - lda, stridea, x, incx, stridex, beta, y, incy, - stridey, batch_size); + oneapi::math::blas::generic::MAJOR::gemv_batch(selector.get_queue(), trans, m, n, alpha, a, lda, + stridea, x, incx, stridex, beta, y, incy, + stridey, batch_size); } void gemv_batch(backend_selector selector, transpose trans, std::int64_t m, @@ -552,9 +552,9 @@ void gemv_batch(backend_selector selector, transpose trans, st sycl::buffer, 1>& x, std::int64_t incx, std::int64_t stridex, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::gemv_batch(selector.get_queue(), trans, m, n, alpha, a, - lda, stridea, x, incx, stridex, beta, y, incy, - stridey, batch_size); + oneapi::math::blas::generic::MAJOR::gemv_batch(selector.get_queue(), trans, m, n, alpha, a, lda, + stridea, x, incx, stridex, beta, y, incy, + stridey, batch_size); } void dgmm_batch(backend_selector selector, side left_right, std::int64_t m, @@ -563,8 +563,8 @@ void dgmm_batch(backend_selector selector, side left_right, st sycl::buffer& c, std::int64_t ldc, std::int64_t stridec, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::dgmm_batch(selector.get_queue(), left_right, m, n, a, lda, - stridea, x, incx, stridex, c, ldc, stridec, - batch_size); + stridea, x, incx, stridex, c, ldc, stridec, + batch_size); } void dgmm_batch(backend_selector selector, side left_right, std::int64_t m, @@ -573,8 +573,8 @@ void dgmm_batch(backend_selector selector, side left_right, st sycl::buffer& c, std::int64_t ldc, std::int64_t stridec, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::dgmm_batch(selector.get_queue(), left_right, m, n, a, lda, - stridea, x, incx, stridex, c, ldc, stridec, - batch_size); + stridea, x, incx, stridex, c, ldc, stridec, + batch_size); } void dgmm_batch(backend_selector selector, side left_right, std::int64_t m, @@ -583,8 +583,8 @@ void dgmm_batch(backend_selector selector, side left_right, st std::int64_t stridex, sycl::buffer, 1>& c, std::int64_t ldc, std::int64_t stridec, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::dgmm_batch(selector.get_queue(), left_right, m, n, a, lda, - stridea, x, incx, stridex, c, ldc, stridec, - batch_size); + stridea, x, incx, stridex, c, ldc, stridec, + batch_size); } void dgmm_batch(backend_selector selector, side left_right, std::int64_t m, @@ -593,36 +593,36 @@ void dgmm_batch(backend_selector selector, side left_right, st std::int64_t stridex, sycl::buffer, 1>& c, std::int64_t ldc, std::int64_t stridec, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::dgmm_batch(selector.get_queue(), left_right, m, n, a, lda, - stridea, x, incx, stridex, c, ldc, stridec, - batch_size); + stridea, x, incx, stridex, c, ldc, stridec, + batch_size); } -void her(backend_selector selector, uplo upper_lower, std::int64_t n, - float alpha, sycl::buffer, 1>& x, std::int64_t incx, +void her(backend_selector selector, uplo upper_lower, std::int64_t n, float alpha, + sycl::buffer, 1>& x, std::int64_t incx, sycl::buffer, 1>& a, std::int64_t lda) { - oneapi::math::blas::generic::MAJOR::her(selector.get_queue(), upper_lower, n, alpha, x, incx, - a, lda); + oneapi::math::blas::generic::MAJOR::her(selector.get_queue(), upper_lower, n, alpha, x, incx, a, + lda); } void her(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, sycl::buffer, 1>& x, std::int64_t incx, sycl::buffer, 1>& a, std::int64_t lda) { - oneapi::math::blas::generic::MAJOR::her(selector.get_queue(), upper_lower, n, alpha, x, incx, - a, lda); + oneapi::math::blas::generic::MAJOR::her(selector.get_queue(), upper_lower, n, alpha, x, incx, a, + lda); } -void hpr(backend_selector selector, uplo upper_lower, std::int64_t n, - float alpha, sycl::buffer, 1>& x, std::int64_t incx, +void hpr(backend_selector selector, uplo upper_lower, std::int64_t n, float alpha, + sycl::buffer, 1>& x, std::int64_t incx, sycl::buffer, 1>& a) { oneapi::math::blas::generic::MAJOR::hpr(selector.get_queue(), upper_lower, n, alpha, x, incx, - a); + a); } void hpr(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, sycl::buffer, 1>& x, std::int64_t incx, sycl::buffer, 1>& a) { oneapi::math::blas::generic::MAJOR::hpr(selector.get_queue(), upper_lower, n, alpha, x, incx, - a); + a); } void iamin(backend_selector selector, std::int64_t n, sycl::buffer& x, @@ -652,7 +652,7 @@ void hpmv(backend_selector selector, uplo upper_lower, std::in sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::hpmv(selector.get_queue(), upper_lower, n, alpha, a, x, - incx, beta, y, incy); + incx, beta, y, incy); } void hpmv(backend_selector selector, uplo upper_lower, std::int64_t n, @@ -660,21 +660,21 @@ void hpmv(backend_selector selector, uplo upper_lower, std::in sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::hpmv(selector.get_queue(), upper_lower, n, alpha, a, x, - incx, beta, y, incy); + incx, beta, y, incy); } void spmv(backend_selector selector, uplo upper_lower, std::int64_t n, float alpha, sycl::buffer& a, sycl::buffer& x, std::int64_t incx, float beta, sycl::buffer& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::spmv(selector.get_queue(), upper_lower, n, alpha, a, x, - incx, beta, y, incy); + incx, beta, y, incy); } void spmv(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, sycl::buffer& a, sycl::buffer& x, std::int64_t incx, double beta, sycl::buffer& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::spmv(selector.get_queue(), upper_lower, n, alpha, a, x, - incx, beta, y, incy); + incx, beta, y, incy); } void gemm_bias(backend_selector selector, transpose transa, transpose transb, @@ -683,8 +683,8 @@ void gemm_bias(backend_selector selector, transpose transa, tr std::int64_t ldb, uint8_t bo, float beta, sycl::buffer& c, std::int64_t ldc, sycl::buffer& co) { oneapi::math::blas::generic::MAJOR::gemm_bias(selector.get_queue(), transa, transb, offsetc, m, - n, k, alpha, a, lda, ao, b, ldb, bo, beta, c, - ldc, co); + n, k, alpha, a, lda, ao, b, ldb, bo, beta, c, ldc, + co); } void gemm_bias(backend_selector selector, transpose transa, transpose transb, @@ -693,8 +693,8 @@ void gemm_bias(backend_selector selector, transpose transa, tr std::int64_t ldb, int8_t bo, float beta, sycl::buffer& c, std::int64_t ldc, sycl::buffer& co) { oneapi::math::blas::generic::MAJOR::gemm_bias(selector.get_queue(), transa, transb, offsetc, m, - n, k, alpha, a, lda, ao, b, ldb, bo, beta, c, - ldc, co); + n, k, alpha, a, lda, ao, b, ldb, bo, beta, c, ldc, + co); } void gemm_bias(backend_selector selector, transpose transa, transpose transb, @@ -703,8 +703,8 @@ void gemm_bias(backend_selector selector, transpose transa, tr sycl::buffer& b, std::int64_t ldb, int8_t bo, float beta, sycl::buffer& c, std::int64_t ldc, sycl::buffer& co) { oneapi::math::blas::generic::MAJOR::gemm_bias(selector.get_queue(), transa, transb, offsetc, m, - n, k, alpha, a, lda, ao, b, ldb, bo, beta, c, - ldc, co); + n, k, alpha, a, lda, ao, b, ldb, bo, beta, c, ldc, + co); } void gemm_bias(backend_selector selector, transpose transa, transpose transb, @@ -713,8 +713,8 @@ void gemm_bias(backend_selector selector, transpose transa, tr sycl::buffer& b, std::int64_t ldb, uint8_t bo, float beta, sycl::buffer& c, std::int64_t ldc, sycl::buffer& co) { oneapi::math::blas::generic::MAJOR::gemm_bias(selector.get_queue(), transa, transb, offsetc, m, - n, k, alpha, a, lda, ao, b, ldb, bo, beta, c, - ldc, co); + n, k, alpha, a, lda, ao, b, ldb, bo, beta, c, ldc, + co); } void swap(backend_selector selector, std::int64_t n, sycl::buffer& x, @@ -743,16 +743,16 @@ void geru(backend_selector selector, std::int64_t m, std::int6 std::complex alpha, sycl::buffer, 1>& x, std::int64_t incx, sycl::buffer, 1>& y, std::int64_t incy, sycl::buffer, 1>& a, std::int64_t lda) { - oneapi::math::blas::generic::MAJOR::geru(selector.get_queue(), m, n, alpha, x, incx, y, incy, - a, lda); + oneapi::math::blas::generic::MAJOR::geru(selector.get_queue(), m, n, alpha, x, incx, y, incy, a, + lda); } void geru(backend_selector selector, std::int64_t m, std::int64_t n, std::complex alpha, sycl::buffer, 1>& x, std::int64_t incx, sycl::buffer, 1>& y, std::int64_t incy, sycl::buffer, 1>& a, std::int64_t lda) { - oneapi::math::blas::generic::MAJOR::geru(selector.get_queue(), m, n, alpha, x, incx, y, incy, - a, lda); + oneapi::math::blas::generic::MAJOR::geru(selector.get_queue(), m, n, alpha, x, incx, y, incy, a, + lda); } void nrm2(backend_selector selector, std::int64_t n, @@ -782,7 +782,7 @@ void gemm(backend_selector selector, transpose transa, transpo std::int64_t lda, sycl::buffer& b, std::int64_t ldb, float beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, alpha, - a, lda, b, ldb, beta, c, ldc); + a, lda, b, ldb, beta, c, ldc); } void gemm(backend_selector selector, transpose transa, transpose transb, @@ -790,7 +790,7 @@ void gemm(backend_selector selector, transpose transa, transpo std::int64_t lda, sycl::buffer& b, std::int64_t ldb, double beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, alpha, - a, lda, b, ldb, beta, c, ldc); + a, lda, b, ldb, beta, c, ldc); } void gemm(backend_selector selector, transpose transa, transpose transb, @@ -799,7 +799,7 @@ void gemm(backend_selector selector, transpose transa, transpo sycl::buffer, 1>& b, std::int64_t ldb, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, alpha, - a, lda, b, ldb, beta, c, ldc); + a, lda, b, ldb, beta, c, ldc); } void gemm(backend_selector selector, transpose transa, transpose transb, @@ -808,7 +808,7 @@ void gemm(backend_selector selector, transpose transa, transpo sycl::buffer, 1>& b, std::int64_t ldb, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, alpha, - a, lda, b, ldb, beta, c, ldc); + a, lda, b, ldb, beta, c, ldc); } void gemm(backend_selector selector, transpose transa, transpose transb, @@ -816,7 +816,7 @@ void gemm(backend_selector selector, transpose transa, transpo sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb, sycl::half beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, alpha, - a, lda, b, ldb, beta, c, ldc); + a, lda, b, ldb, beta, c, ldc); } void gemm(backend_selector selector, transpose transa, transpose transb, @@ -824,7 +824,7 @@ void gemm(backend_selector selector, transpose transa, transpo sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb, float beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, alpha, - a, lda, b, ldb, beta, c, ldc); + a, lda, b, ldb, beta, c, ldc); } void gemm(backend_selector selector, transpose transa, transpose transb, @@ -832,35 +832,35 @@ void gemm(backend_selector selector, transpose transa, transpo std::int64_t lda, sycl::buffer& b, std::int64_t ldb, float beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, alpha, - a, lda, b, ldb, beta, c, ldc); + a, lda, b, ldb, beta, c, ldc); } void syr2(backend_selector selector, uplo upper_lower, std::int64_t n, float alpha, sycl::buffer& x, std::int64_t incx, sycl::buffer& y, std::int64_t incy, sycl::buffer& a, std::int64_t lda) { oneapi::math::blas::generic::MAJOR::syr2(selector.get_queue(), upper_lower, n, alpha, x, incx, - y, incy, a, lda); + y, incy, a, lda); } void syr2(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, sycl::buffer& x, std::int64_t incx, sycl::buffer& y, std::int64_t incy, sycl::buffer& a, std::int64_t lda) { oneapi::math::blas::generic::MAJOR::syr2(selector.get_queue(), upper_lower, n, alpha, x, incx, - y, incy, a, lda); + y, incy, a, lda); } void ger(backend_selector selector, std::int64_t m, std::int64_t n, float alpha, sycl::buffer& x, std::int64_t incx, sycl::buffer& y, std::int64_t incy, sycl::buffer& a, std::int64_t lda) { oneapi::math::blas::generic::MAJOR::ger(selector.get_queue(), m, n, alpha, x, incx, y, incy, a, - lda); + lda); } void ger(backend_selector selector, std::int64_t m, std::int64_t n, double alpha, sycl::buffer& x, std::int64_t incx, sycl::buffer& y, std::int64_t incy, sycl::buffer& a, std::int64_t lda) { oneapi::math::blas::generic::MAJOR::ger(selector.get_queue(), m, n, alpha, x, incx, y, incy, a, - lda); + lda); } void trsm(backend_selector selector, side left_right, uplo upper_lower, @@ -868,7 +868,7 @@ void trsm(backend_selector selector, side left_right, uplo upp sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::trsm(selector.get_queue(), left_right, upper_lower, trans, - unit_diag, m, n, alpha, a, lda, b, ldb); + unit_diag, m, n, alpha, a, lda, b, ldb); } void trsm(backend_selector selector, side left_right, uplo upper_lower, @@ -876,7 +876,7 @@ void trsm(backend_selector selector, side left_right, uplo upp sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::trsm(selector.get_queue(), left_right, upper_lower, trans, - unit_diag, m, n, alpha, a, lda, b, ldb); + unit_diag, m, n, alpha, a, lda, b, ldb); } void trsm(backend_selector selector, side left_right, uplo upper_lower, @@ -884,7 +884,7 @@ void trsm(backend_selector selector, side left_right, uplo upp std::complex alpha, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::trsm(selector.get_queue(), left_right, upper_lower, trans, - unit_diag, m, n, alpha, a, lda, b, ldb); + unit_diag, m, n, alpha, a, lda, b, ldb); } void trsm(backend_selector selector, side left_right, uplo upper_lower, @@ -892,7 +892,7 @@ void trsm(backend_selector selector, side left_right, uplo upp std::complex alpha, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::trsm(selector.get_queue(), left_right, upper_lower, trans, - unit_diag, m, n, alpha, a, lda, b, ldb); + unit_diag, m, n, alpha, a, lda, b, ldb); } void dotu(backend_selector selector, std::int64_t n, @@ -915,7 +915,7 @@ void hemm(backend_selector selector, side left_right, uplo upp sycl::buffer, 1>& b, std::int64_t ldb, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::hemm(selector.get_queue(), left_right, upper_lower, m, n, - alpha, a, lda, b, ldb, beta, c, ldc); + alpha, a, lda, b, ldb, beta, c, ldc); } void hemm(backend_selector selector, side left_right, uplo upper_lower, @@ -924,7 +924,7 @@ void hemm(backend_selector selector, side left_right, uplo upp sycl::buffer, 1>& b, std::int64_t ldb, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::hemm(selector.get_queue(), left_right, upper_lower, m, n, - alpha, a, lda, b, ldb, beta, c, ldc); + alpha, a, lda, b, ldb, beta, c, ldc); } void hpr2(backend_selector selector, uplo upper_lower, std::int64_t n, @@ -932,7 +932,7 @@ void hpr2(backend_selector selector, uplo upper_lower, std::in sycl::buffer, 1>& y, std::int64_t incy, sycl::buffer, 1>& a) { oneapi::math::blas::generic::MAJOR::hpr2(selector.get_queue(), upper_lower, n, alpha, x, incx, - y, incy, a); + y, incy, a); } void hpr2(backend_selector selector, uplo upper_lower, std::int64_t n, @@ -940,7 +940,7 @@ void hpr2(backend_selector selector, uplo upper_lower, std::in sycl::buffer, 1>& y, std::int64_t incy, sycl::buffer, 1>& a) { oneapi::math::blas::generic::MAJOR::hpr2(selector.get_queue(), upper_lower, n, alpha, x, incx, - y, incy, a); + y, incy, a); } void gbmv(backend_selector selector, transpose trans, std::int64_t m, @@ -948,7 +948,7 @@ void gbmv(backend_selector selector, transpose trans, std::int std::int64_t lda, sycl::buffer& x, std::int64_t incx, float beta, sycl::buffer& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::gbmv(selector.get_queue(), trans, m, n, kl, ku, alpha, a, - lda, x, incx, beta, y, incy); + lda, x, incx, beta, y, incy); } void gbmv(backend_selector selector, transpose trans, std::int64_t m, @@ -956,7 +956,7 @@ void gbmv(backend_selector selector, transpose trans, std::int sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx, double beta, sycl::buffer& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::gbmv(selector.get_queue(), trans, m, n, kl, ku, alpha, a, - lda, x, incx, beta, y, incy); + lda, x, incx, beta, y, incy); } void gbmv(backend_selector selector, transpose trans, std::int64_t m, @@ -965,7 +965,7 @@ void gbmv(backend_selector selector, transpose trans, std::int sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::gbmv(selector.get_queue(), trans, m, n, kl, ku, alpha, a, - lda, x, incx, beta, y, incy); + lda, x, incx, beta, y, incy); } void gbmv(backend_selector selector, transpose trans, std::int64_t m, @@ -974,35 +974,35 @@ void gbmv(backend_selector selector, transpose trans, std::int sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { oneapi::math::blas::generic::MAJOR::gbmv(selector.get_queue(), trans, m, n, kl, ku, alpha, a, - lda, x, incx, beta, y, incy); + lda, x, incx, beta, y, incy); } void tbmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, std::int64_t k, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tbmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, k, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::tbmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + k, a, lda, x, incx); } void tbmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, std::int64_t k, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tbmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, k, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::tbmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + k, a, lda, x, incx); } void tbmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, std::int64_t k, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tbmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, k, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::tbmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + k, a, lda, x, incx); } void tbmv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, std::int64_t k, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tbmv(selector.get_queue(), upper_lower, trans, unit_diag, - n, k, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::tbmv(selector.get_queue(), upper_lower, trans, unit_diag, n, + k, a, lda, x, incx); } void symm(backend_selector selector, side left_right, uplo upper_lower, @@ -1010,7 +1010,7 @@ void symm(backend_selector selector, side left_right, uplo upp sycl::buffer& b, std::int64_t ldb, float beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::symm(selector.get_queue(), left_right, upper_lower, m, n, - alpha, a, lda, b, ldb, beta, c, ldc); + alpha, a, lda, b, ldb, beta, c, ldc); } void symm(backend_selector selector, side left_right, uplo upper_lower, @@ -1018,7 +1018,7 @@ void symm(backend_selector selector, side left_right, uplo upp std::int64_t lda, sycl::buffer& b, std::int64_t ldb, double beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::symm(selector.get_queue(), left_right, upper_lower, m, n, - alpha, a, lda, b, ldb, beta, c, ldc); + alpha, a, lda, b, ldb, beta, c, ldc); } void symm(backend_selector selector, side left_right, uplo upper_lower, @@ -1027,7 +1027,7 @@ void symm(backend_selector selector, side left_right, uplo upp sycl::buffer, 1>& b, std::int64_t ldb, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::symm(selector.get_queue(), left_right, upper_lower, m, n, - alpha, a, lda, b, ldb, beta, c, ldc); + alpha, a, lda, b, ldb, beta, c, ldc); } void symm(backend_selector selector, side left_right, uplo upper_lower, @@ -1036,7 +1036,7 @@ void symm(backend_selector selector, side left_right, uplo upp sycl::buffer, 1>& b, std::int64_t ldb, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::symm(selector.get_queue(), left_right, upper_lower, m, n, - alpha, a, lda, b, ldb, beta, c, ldc); + alpha, a, lda, b, ldb, beta, c, ldc); } void dotc(backend_selector selector, std::int64_t n, @@ -1053,18 +1053,18 @@ void dotc(backend_selector selector, std::int64_t n, oneapi::math::blas::generic::MAJOR::dotc(selector.get_queue(), n, x, incx, y, incy, result); } -void syr(backend_selector selector, uplo upper_lower, std::int64_t n, - float alpha, sycl::buffer& x, std::int64_t incx, sycl::buffer& a, +void syr(backend_selector selector, uplo upper_lower, std::int64_t n, float alpha, + sycl::buffer& x, std::int64_t incx, sycl::buffer& a, std::int64_t lda) { - oneapi::math::blas::generic::MAJOR::syr(selector.get_queue(), upper_lower, n, alpha, x, incx, - a, lda); + oneapi::math::blas::generic::MAJOR::syr(selector.get_queue(), upper_lower, n, alpha, x, incx, a, + lda); } void syr(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, sycl::buffer& x, std::int64_t incx, sycl::buffer& a, std::int64_t lda) { - oneapi::math::blas::generic::MAJOR::syr(selector.get_queue(), upper_lower, n, alpha, x, incx, - a, lda); + oneapi::math::blas::generic::MAJOR::syr(selector.get_queue(), upper_lower, n, alpha, x, incx, a, + lda); } void trmm(backend_selector selector, side left_right, uplo upper_lower, @@ -1072,7 +1072,7 @@ void trmm(backend_selector selector, side left_right, uplo upp sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::trmm(selector.get_queue(), left_right, upper_lower, trans, - unit_diag, m, n, alpha, a, lda, b, ldb); + unit_diag, m, n, alpha, a, lda, b, ldb); } void trmm(backend_selector selector, side left_right, uplo upper_lower, @@ -1080,7 +1080,7 @@ void trmm(backend_selector selector, side left_right, uplo upp sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::trmm(selector.get_queue(), left_right, upper_lower, trans, - unit_diag, m, n, alpha, a, lda, b, ldb); + unit_diag, m, n, alpha, a, lda, b, ldb); } void trmm(backend_selector selector, side left_right, uplo upper_lower, @@ -1088,7 +1088,7 @@ void trmm(backend_selector selector, side left_right, uplo upp std::complex alpha, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::trmm(selector.get_queue(), left_right, upper_lower, trans, - unit_diag, m, n, alpha, a, lda, b, ldb); + unit_diag, m, n, alpha, a, lda, b, ldb); } void trmm(backend_selector selector, side left_right, uplo upper_lower, @@ -1096,7 +1096,7 @@ void trmm(backend_selector selector, side left_right, uplo upp std::complex alpha, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::trmm(selector.get_queue(), left_right, upper_lower, trans, - unit_diag, m, n, alpha, a, lda, b, ldb); + unit_diag, m, n, alpha, a, lda, b, ldb); } void rotmg(backend_selector selector, sycl::buffer& d1, @@ -1114,57 +1114,57 @@ void rotmg(backend_selector selector, sycl::buffer& void tpsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer& a, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, x, incx); + oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, x, incx); } void tpsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer& a, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, x, incx); + oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, x, incx); } void tpsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer, 1>& a, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, x, incx); + oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, x, incx); } void tpsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer, 1>& a, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, x, incx); + oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, x, incx); } void trsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::trsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::trsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, lda, x, incx); } void trsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::trsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::trsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, lda, x, incx); } void trsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::trsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::trsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, lda, x, incx); } void trsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::trsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::trsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + a, lda, x, incx); } void copy(backend_selector selector, std::int64_t n, sycl::buffer& x, @@ -1194,7 +1194,7 @@ void copy_batch(backend_selector selector, std::int64_t n, sycl::buffer& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::copy_batch(selector.get_queue(), n, x, incx, stridex, y, - incy, stridey, batch_size); + incy, stridey, batch_size); } void copy_batch(backend_selector selector, std::int64_t n, @@ -1202,7 +1202,7 @@ void copy_batch(backend_selector selector, std::int64_t n, sycl::buffer& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::copy_batch(selector.get_queue(), n, x, incx, stridex, y, - incy, stridey, batch_size); + incy, stridey, batch_size); } void copy_batch(backend_selector selector, std::int64_t n, @@ -1210,7 +1210,7 @@ void copy_batch(backend_selector selector, std::int64_t n, sycl::buffer, 1>& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::copy_batch(selector.get_queue(), n, x, incx, stridex, y, - incy, stridey, batch_size); + incy, stridey, batch_size); } void copy_batch(backend_selector selector, std::int64_t n, @@ -1218,23 +1218,23 @@ void copy_batch(backend_selector selector, std::int64_t n, sycl::buffer, 1>& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::copy_batch(selector.get_queue(), n, x, incx, stridex, y, - incy, stridey, batch_size); + incy, stridey, batch_size); } void hemv(backend_selector selector, uplo upper_lower, std::int64_t n, std::complex alpha, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { - oneapi::math::blas::generic::MAJOR::hemv(selector.get_queue(), upper_lower, n, alpha, a, lda, - x, incx, beta, y, incy); + oneapi::math::blas::generic::MAJOR::hemv(selector.get_queue(), upper_lower, n, alpha, a, lda, x, + incx, beta, y, incy); } void hemv(backend_selector selector, uplo upper_lower, std::int64_t n, std::complex alpha, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx, std::complex beta, sycl::buffer, 1>& y, std::int64_t incy) { - oneapi::math::blas::generic::MAJOR::hemv(selector.get_queue(), upper_lower, n, alpha, a, lda, - x, incx, beta, y, incy); + oneapi::math::blas::generic::MAJOR::hemv(selector.get_queue(), upper_lower, n, alpha, a, lda, x, + incx, beta, y, incy); } void gemmt(backend_selector selector, uplo upper_lower, transpose transa, @@ -1242,7 +1242,7 @@ void gemmt(backend_selector selector, uplo upper_lower, transp std::int64_t lda, sycl::buffer& b, std::int64_t ldb, float beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, transa, transb, n, - k, alpha, a, lda, b, ldb, beta, c, ldc); + k, alpha, a, lda, b, ldb, beta, c, ldc); } void gemmt(backend_selector selector, uplo upper_lower, transpose transa, @@ -1250,7 +1250,7 @@ void gemmt(backend_selector selector, uplo upper_lower, transp sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb, double beta, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, transa, transb, n, - k, alpha, a, lda, b, ldb, beta, c, ldc); + k, alpha, a, lda, b, ldb, beta, c, ldc); } void gemmt(backend_selector selector, uplo upper_lower, transpose transa, @@ -1259,7 +1259,7 @@ void gemmt(backend_selector selector, uplo upper_lower, transp sycl::buffer, 1>& b, std::int64_t ldb, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, transa, transb, n, - k, alpha, a, lda, b, ldb, beta, c, ldc); + k, alpha, a, lda, b, ldb, beta, c, ldc); } void gemmt(backend_selector selector, uplo upper_lower, transpose transa, @@ -1268,7 +1268,7 @@ void gemmt(backend_selector selector, uplo upper_lower, transp sycl::buffer, 1>& b, std::int64_t ldb, std::complex beta, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, transa, transb, n, - k, alpha, a, lda, b, ldb, beta, c, ldc); + k, alpha, a, lda, b, ldb, beta, c, ldc); } void asum(backend_selector selector, std::int64_t n, @@ -1297,58 +1297,58 @@ void sbmv(backend_selector selector, uplo upper_lower, std::in std::int64_t k, float alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx, float beta, sycl::buffer& y, std::int64_t incy) { - oneapi::math::blas::generic::MAJOR::sbmv(selector.get_queue(), upper_lower, n, k, alpha, a, - lda, x, incx, beta, y, incy); + oneapi::math::blas::generic::MAJOR::sbmv(selector.get_queue(), upper_lower, n, k, alpha, a, lda, + x, incx, beta, y, incy); } void sbmv(backend_selector selector, uplo upper_lower, std::int64_t n, std::int64_t k, double alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx, double beta, sycl::buffer& y, std::int64_t incy) { - oneapi::math::blas::generic::MAJOR::sbmv(selector.get_queue(), upper_lower, n, k, alpha, a, - lda, x, incx, beta, y, incy); + oneapi::math::blas::generic::MAJOR::sbmv(selector.get_queue(), upper_lower, n, k, alpha, a, lda, + x, incx, beta, y, incy); } void tbsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, std::int64_t k, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tbsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, k, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::tbsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + k, a, lda, x, incx); } void tbsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, std::int64_t k, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tbsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, k, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::tbsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + k, a, lda, x, incx); } void tbsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, std::int64_t k, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tbsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, k, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::tbsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + k, a, lda, x, incx); } void tbsv(backend_selector selector, uplo upper_lower, transpose trans, diag unit_diag, std::int64_t n, std::int64_t k, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& x, std::int64_t incx) { - oneapi::math::blas::generic::MAJOR::tbsv(selector.get_queue(), upper_lower, trans, unit_diag, - n, k, a, lda, x, incx); + oneapi::math::blas::generic::MAJOR::tbsv(selector.get_queue(), upper_lower, trans, unit_diag, n, + k, a, lda, x, incx); } void spr2(backend_selector selector, uplo upper_lower, std::int64_t n, float alpha, sycl::buffer& x, std::int64_t incx, sycl::buffer& y, std::int64_t incy, sycl::buffer& a) { oneapi::math::blas::generic::MAJOR::spr2(selector.get_queue(), upper_lower, n, alpha, x, incx, - y, incy, a); + y, incy, a); } void spr2(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, sycl::buffer& x, std::int64_t incx, sycl::buffer& y, std::int64_t incy, sycl::buffer& a) { oneapi::math::blas::generic::MAJOR::spr2(selector.get_queue(), upper_lower, n, alpha, x, incx, - y, incy, a); + y, incy, a); } void iamax(backend_selector selector, std::int64_t n, sycl::buffer& x, @@ -1409,8 +1409,8 @@ void trsm_batch(backend_selector selector, side left_right, up sycl::buffer& b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::trsm_batch(selector.get_queue(), left_right, upper_lower, - trans, unit_diag, m, n, alpha, a, lda, stride_a, - b, ldb, stride_b, batch_size); + trans, unit_diag, m, n, alpha, a, lda, stride_a, + b, ldb, stride_b, batch_size); } void trsm_batch(backend_selector selector, side left_right, uplo upper_lower, @@ -1419,8 +1419,8 @@ void trsm_batch(backend_selector selector, side left_right, up sycl::buffer& b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::trsm_batch(selector.get_queue(), left_right, upper_lower, - trans, unit_diag, m, n, alpha, a, lda, stride_a, - b, ldb, stride_b, batch_size); + trans, unit_diag, m, n, alpha, a, lda, stride_a, + b, ldb, stride_b, batch_size); } void trsm_batch(backend_selector selector, side left_right, uplo upper_lower, @@ -1429,8 +1429,8 @@ void trsm_batch(backend_selector selector, side left_right, up std::int64_t lda, std::int64_t stride_a, sycl::buffer, 1>& b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::trsm_batch(selector.get_queue(), left_right, upper_lower, - trans, unit_diag, m, n, alpha, a, lda, stride_a, - b, ldb, stride_b, batch_size); + trans, unit_diag, m, n, alpha, a, lda, stride_a, + b, ldb, stride_b, batch_size); } void trsm_batch(backend_selector selector, side left_right, uplo upper_lower, @@ -1439,8 +1439,8 @@ void trsm_batch(backend_selector selector, side left_right, up std::int64_t lda, std::int64_t stride_a, sycl::buffer, 1>& b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::trsm_batch(selector.get_queue(), left_right, upper_lower, - trans, unit_diag, m, n, alpha, a, lda, stride_a, - b, ldb, stride_b, batch_size); + trans, unit_diag, m, n, alpha, a, lda, stride_a, + b, ldb, stride_b, batch_size); } void her2k(backend_selector selector, uplo upper_lower, transpose trans, @@ -1448,8 +1448,8 @@ void her2k(backend_selector selector, uplo upper_lower, transp sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& b, std::int64_t ldb, float beta, sycl::buffer, 1>& c, std::int64_t ldc) { - oneapi::math::blas::generic::MAJOR::her2k(selector.get_queue(), upper_lower, trans, n, k, - alpha, a, lda, b, ldb, beta, c, ldc); + oneapi::math::blas::generic::MAJOR::her2k(selector.get_queue(), upper_lower, trans, n, k, alpha, + a, lda, b, ldb, beta, c, ldc); } void her2k(backend_selector selector, uplo upper_lower, transpose trans, @@ -1457,8 +1457,8 @@ void her2k(backend_selector selector, uplo upper_lower, transp sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& b, std::int64_t ldb, double beta, sycl::buffer, 1>& c, std::int64_t ldc) { - oneapi::math::blas::generic::MAJOR::her2k(selector.get_queue(), upper_lower, trans, n, k, - alpha, a, lda, b, ldb, beta, c, ldc); + oneapi::math::blas::generic::MAJOR::her2k(selector.get_queue(), upper_lower, trans, n, k, alpha, + a, lda, b, ldb, beta, c, ldc); } void rotg(backend_selector selector, sycl::buffer& a, @@ -1486,31 +1486,31 @@ void rotg(backend_selector selector, sycl::buffer selector, uplo upper_lower, std::int64_t n, float alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx, float beta, sycl::buffer& y, std::int64_t incy) { - oneapi::math::blas::generic::MAJOR::symv(selector.get_queue(), upper_lower, n, alpha, a, lda, - x, incx, beta, y, incy); + oneapi::math::blas::generic::MAJOR::symv(selector.get_queue(), upper_lower, n, alpha, a, lda, x, + incx, beta, y, incy); } void symv(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx, double beta, sycl::buffer& y, std::int64_t incy) { - oneapi::math::blas::generic::MAJOR::symv(selector.get_queue(), upper_lower, n, alpha, a, lda, - x, incx, beta, y, incy); + oneapi::math::blas::generic::MAJOR::symv(selector.get_queue(), upper_lower, n, alpha, a, lda, x, + incx, beta, y, incy); } void omatcopy_batch(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, float alpha, sycl::buffer& a, std::int64_t lda, std::int64_t stride_a, sycl::buffer& b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::omatcopy_batch( - selector.get_queue(), trans, m, n, alpha, a, lda, stride_a, b, ldb, stride_b, batch_size); + oneapi::math::blas::generic::MAJOR::omatcopy_batch(selector.get_queue(), trans, m, n, alpha, a, + lda, stride_a, b, ldb, stride_b, batch_size); } void omatcopy_batch(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, double alpha, sycl::buffer& a, std::int64_t lda, std::int64_t stride_a, sycl::buffer& b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::omatcopy_batch( - selector.get_queue(), trans, m, n, alpha, a, lda, stride_a, b, ldb, stride_b, batch_size); + oneapi::math::blas::generic::MAJOR::omatcopy_batch(selector.get_queue(), trans, m, n, alpha, a, + lda, stride_a, b, ldb, stride_b, batch_size); } void omatcopy_batch(backend_selector selector, transpose trans, std::int64_t m, @@ -1518,8 +1518,8 @@ void omatcopy_batch(backend_selector selector, transpose trans sycl::buffer, 1>& a, std::int64_t lda, std::int64_t stride_a, sycl::buffer, 1>& b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::omatcopy_batch( - selector.get_queue(), trans, m, n, alpha, a, lda, stride_a, b, ldb, stride_b, batch_size); + oneapi::math::blas::generic::MAJOR::omatcopy_batch(selector.get_queue(), trans, m, n, alpha, a, + lda, stride_a, b, ldb, stride_b, batch_size); } void omatcopy_batch(backend_selector selector, transpose trans, std::int64_t m, @@ -1527,38 +1527,38 @@ void omatcopy_batch(backend_selector selector, transpose trans sycl::buffer, 1>& a, std::int64_t lda, std::int64_t stride_a, sycl::buffer, 1>& b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::omatcopy_batch( - selector.get_queue(), trans, m, n, alpha, a, lda, stride_a, b, ldb, stride_b, batch_size); + oneapi::math::blas::generic::MAJOR::omatcopy_batch(selector.get_queue(), trans, m, n, alpha, a, + lda, stride_a, b, ldb, stride_b, batch_size); } void imatcopy_batch(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, float alpha, sycl::buffer& ab, std::int64_t lda, std::int64_t ldb, std::int64_t stride, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::imatcopy_batch(selector.get_queue(), trans, m, n, alpha, - ab, lda, ldb, stride, batch_size); + oneapi::math::blas::generic::MAJOR::imatcopy_batch(selector.get_queue(), trans, m, n, alpha, ab, + lda, ldb, stride, batch_size); } void imatcopy_batch(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, double alpha, sycl::buffer& ab, std::int64_t lda, std::int64_t ldb, std::int64_t stride, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::imatcopy_batch(selector.get_queue(), trans, m, n, alpha, - ab, lda, ldb, stride, batch_size); + oneapi::math::blas::generic::MAJOR::imatcopy_batch(selector.get_queue(), trans, m, n, alpha, ab, + lda, ldb, stride, batch_size); } void imatcopy_batch(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, std::complex alpha, sycl::buffer, 1>& ab, std::int64_t lda, std::int64_t ldb, std::int64_t stride, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::imatcopy_batch(selector.get_queue(), trans, m, n, alpha, - ab, lda, ldb, stride, batch_size); + oneapi::math::blas::generic::MAJOR::imatcopy_batch(selector.get_queue(), trans, m, n, alpha, ab, + lda, ldb, stride, batch_size); } void imatcopy_batch(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, std::complex alpha, sycl::buffer, 1>& ab, std::int64_t lda, std::int64_t ldb, std::int64_t stride, std::int64_t batch_size) { - oneapi::math::blas::generic::MAJOR::imatcopy_batch(selector.get_queue(), trans, m, n, alpha, - ab, lda, ldb, stride, batch_size); + oneapi::math::blas::generic::MAJOR::imatcopy_batch(selector.get_queue(), trans, m, n, alpha, ab, + lda, ldb, stride, batch_size); } void omatadd_batch(backend_selector selector, transpose transa, transpose transb, @@ -1567,8 +1567,8 @@ void omatadd_batch(backend_selector selector, transpose transa std::int64_t ldb, std::int64_t stride_b, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::omatadd_batch(selector.get_queue(), transa, transb, m, n, - alpha, a, lda, stride_a, beta, b, ldb, - stride_b, c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, beta, b, ldb, + stride_b, c, ldc, stride_c, batch_size); } void omatadd_batch(backend_selector selector, transpose transa, transpose transb, @@ -1577,8 +1577,8 @@ void omatadd_batch(backend_selector selector, transpose transa std::int64_t ldb, std::int64_t stride_b, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::omatadd_batch(selector.get_queue(), transa, transb, m, n, - alpha, a, lda, stride_a, beta, b, ldb, - stride_b, c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, beta, b, ldb, + stride_b, c, ldc, stride_c, batch_size); } void omatadd_batch(backend_selector selector, transpose transa, transpose transb, @@ -1588,8 +1588,8 @@ void omatadd_batch(backend_selector selector, transpose transa std::int64_t ldb, std::int64_t stride_b, sycl::buffer, 1>& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::omatadd_batch(selector.get_queue(), transa, transb, m, n, - alpha, a, lda, stride_a, beta, b, ldb, - stride_b, c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, beta, b, ldb, + stride_b, c, ldc, stride_c, batch_size); } void omatadd_batch(backend_selector selector, transpose transa, transpose transb, @@ -1600,36 +1600,36 @@ void omatadd_batch(backend_selector selector, transpose transa std::int64_t stride_b, sycl::buffer, 1>& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { oneapi::math::blas::generic::MAJOR::omatadd_batch(selector.get_queue(), transa, transb, m, n, - alpha, a, lda, stride_a, beta, b, ldb, - stride_b, c, ldc, stride_c, batch_size); + alpha, a, lda, stride_a, beta, b, ldb, + stride_b, c, ldc, stride_c, batch_size); } void omatcopy(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, float alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::omatcopy(selector.get_queue(), trans, m, n, alpha, a, lda, - b, ldb); + b, ldb); } void omatcopy(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, double alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::omatcopy(selector.get_queue(), trans, m, n, alpha, a, lda, - b, ldb); + b, ldb); } void omatcopy(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, std::complex alpha, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::omatcopy(selector.get_queue(), trans, m, n, alpha, a, lda, - b, ldb); + b, ldb); } void omatcopy(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, std::complex alpha, sycl::buffer, 1>& a, std::int64_t lda, sycl::buffer, 1>& b, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::omatcopy(selector.get_queue(), trans, m, n, alpha, a, lda, - b, ldb); + b, ldb); } void omatcopy2(backend_selector selector, transpose trans, std::int64_t m, @@ -1637,7 +1637,7 @@ void omatcopy2(backend_selector selector, transpose trans, std std::int64_t stridea, sycl::buffer& b, std::int64_t ldb, std::int64_t strideb) { oneapi::math::blas::generic::MAJOR::omatcopy2(selector.get_queue(), trans, m, n, alpha, a, lda, - stridea, b, ldb, strideb); + stridea, b, ldb, strideb); } void omatcopy2(backend_selector selector, transpose trans, std::int64_t m, @@ -1645,7 +1645,7 @@ void omatcopy2(backend_selector selector, transpose trans, std std::int64_t stridea, sycl::buffer& b, std::int64_t ldb, std::int64_t strideb) { oneapi::math::blas::generic::MAJOR::omatcopy2(selector.get_queue(), trans, m, n, alpha, a, lda, - stridea, b, ldb, strideb); + stridea, b, ldb, strideb); } void omatcopy2(backend_selector selector, transpose trans, std::int64_t m, @@ -1653,7 +1653,7 @@ void omatcopy2(backend_selector selector, transpose trans, std std::int64_t lda, std::int64_t stridea, sycl::buffer, 1>& b, std::int64_t ldb, std::int64_t strideb) { oneapi::math::blas::generic::MAJOR::omatcopy2(selector.get_queue(), trans, m, n, alpha, a, lda, - stridea, b, ldb, strideb); + stridea, b, ldb, strideb); } void omatcopy2(backend_selector selector, transpose trans, std::int64_t m, @@ -1661,35 +1661,35 @@ void omatcopy2(backend_selector selector, transpose trans, std std::int64_t lda, std::int64_t stridea, sycl::buffer, 1>& b, std::int64_t ldb, std::int64_t strideb) { oneapi::math::blas::generic::MAJOR::omatcopy2(selector.get_queue(), trans, m, n, alpha, a, lda, - stridea, b, ldb, strideb); + stridea, b, ldb, strideb); } void imatcopy(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, float alpha, sycl::buffer& ab, std::int64_t lda, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::imatcopy(selector.get_queue(), trans, m, n, alpha, ab, lda, - ldb); + ldb); } void imatcopy(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, double alpha, sycl::buffer& ab, std::int64_t lda, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::imatcopy(selector.get_queue(), trans, m, n, alpha, ab, lda, - ldb); + ldb); } void imatcopy(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, std::complex alpha, sycl::buffer, 1>& ab, std::int64_t lda, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::imatcopy(selector.get_queue(), trans, m, n, alpha, ab, lda, - ldb); + ldb); } void imatcopy(backend_selector selector, transpose trans, std::int64_t m, std::int64_t n, std::complex alpha, sycl::buffer, 1>& ab, std::int64_t lda, std::int64_t ldb) { oneapi::math::blas::generic::MAJOR::imatcopy(selector.get_queue(), trans, m, n, alpha, ab, lda, - ldb); + ldb); } void omatadd(backend_selector selector, transpose transa, transpose transb, @@ -1697,7 +1697,7 @@ void omatadd(backend_selector selector, transpose transa, tran std::int64_t lda, float beta, sycl::buffer& b, std::int64_t ldb, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, m, n, alpha, - a, lda, beta, b, ldb, c, ldc); + a, lda, beta, b, ldb, c, ldc); } void omatadd(backend_selector selector, transpose transa, transpose transb, @@ -1705,7 +1705,7 @@ void omatadd(backend_selector selector, transpose transa, tran std::int64_t lda, double beta, sycl::buffer& b, std::int64_t ldb, sycl::buffer& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, m, n, alpha, - a, lda, beta, b, ldb, c, ldc); + a, lda, beta, b, ldb, c, ldc); } void omatadd(backend_selector selector, transpose transa, transpose transb, @@ -1714,7 +1714,7 @@ void omatadd(backend_selector selector, transpose transa, tran sycl::buffer, 1>& b, std::int64_t ldb, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, m, n, alpha, - a, lda, beta, b, ldb, c, ldc); + a, lda, beta, b, ldb, c, ldc); } void omatadd(backend_selector selector, transpose transa, transpose transb, @@ -1723,7 +1723,7 @@ void omatadd(backend_selector selector, transpose transa, tran sycl::buffer, 1>& b, std::int64_t ldb, sycl::buffer, 1>& c, std::int64_t ldc) { oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, m, n, alpha, - a, lda, beta, b, ldb, c, ldc); + a, lda, beta, b, ldb, c, ldc); } // USM APIs @@ -1745,17 +1745,17 @@ sycl::event syr2(backend_selector selector, uplo upper_lower, return done; } -sycl::event scal(backend_selector selector, std::int64_t n, float alpha, - float* x, std::int64_t incx, const std::vector& dependencies) { +sycl::event scal(backend_selector selector, std::int64_t n, float alpha, float* x, + std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::scal(selector.get_queue(), n, alpha, x, incx, - dependencies); + dependencies); return done; } sycl::event scal(backend_selector selector, std::int64_t n, double alpha, double* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::scal(selector.get_queue(), n, alpha, x, incx, - dependencies); + dependencies); return done; } @@ -1763,7 +1763,7 @@ sycl::event scal(backend_selector selector, std::int64_t n, std::complex alpha, std::complex* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::scal(selector.get_queue(), n, alpha, x, incx, - dependencies); + dependencies); return done; } @@ -1771,7 +1771,7 @@ sycl::event scal(backend_selector selector, std::int64_t n, std::complex alpha, std::complex* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::scal(selector.get_queue(), n, alpha, x, incx, - dependencies); + dependencies); return done; } @@ -1779,7 +1779,7 @@ sycl::event scal(backend_selector selector, std::int64_t n, fl std::complex* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::scal(selector.get_queue(), n, alpha, x, incx, - dependencies); + dependencies); return done; } @@ -1787,7 +1787,7 @@ sycl::event scal(backend_selector selector, std::int64_t n, do std::complex* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::scal(selector.get_queue(), n, alpha, x, incx, - dependencies); + dependencies); return done; } @@ -1829,7 +1829,7 @@ sycl::event tpmv(backend_selector selector, uplo upper_lower, diag unit_diag, std::int64_t n, const float* a, float* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, - unit_diag, n, a, x, incx, dependencies); + unit_diag, n, a, x, incx, dependencies); return done; } @@ -1837,7 +1837,7 @@ sycl::event tpmv(backend_selector selector, uplo upper_lower, diag unit_diag, std::int64_t n, const double* a, double* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, - unit_diag, n, a, x, incx, dependencies); + unit_diag, n, a, x, incx, dependencies); return done; } @@ -1846,7 +1846,7 @@ sycl::event tpmv(backend_selector selector, uplo upper_lower, std::complex* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, - unit_diag, n, a, x, incx, dependencies); + unit_diag, n, a, x, incx, dependencies); return done; } @@ -1855,23 +1855,23 @@ sycl::event tpmv(backend_selector selector, uplo upper_lower, std::complex* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::tpmv(selector.get_queue(), upper_lower, trans, - unit_diag, n, a, x, incx, dependencies); + unit_diag, n, a, x, incx, dependencies); return done; } sycl::event spr(backend_selector selector, uplo upper_lower, std::int64_t n, float alpha, const float* x, std::int64_t incx, float* a, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::spr(selector.get_queue(), upper_lower, n, - alpha, x, incx, a, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::spr(selector.get_queue(), upper_lower, n, alpha, + x, incx, a, dependencies); return done; } sycl::event spr(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, const double* x, std::int64_t incx, double* a, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::spr(selector.get_queue(), upper_lower, n, - alpha, x, incx, a, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::spr(selector.get_queue(), upper_lower, n, alpha, + x, incx, a, dependencies); return done; } @@ -2050,7 +2050,7 @@ sycl::event hbmv(backend_selector selector, uplo upper_lower, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::hbmv(selector.get_queue(), upper_lower, n, k, alpha, a, - lda, x, incx, beta, y, incy, dependencies); + lda, x, incx, beta, y, incy, dependencies); return done; } @@ -2061,15 +2061,15 @@ sycl::event hbmv(backend_selector selector, uplo upper_lower, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::hbmv(selector.get_queue(), upper_lower, n, k, alpha, a, - lda, x, incx, beta, y, incy, dependencies); + lda, x, incx, beta, y, incy, dependencies); return done; } -sycl::event rot(backend_selector selector, std::int64_t n, - std::complex* x, std::int64_t incx, std::complex* y, - std::int64_t incy, float c, float s, const std::vector& dependencies) { +sycl::event rot(backend_selector selector, std::int64_t n, std::complex* x, + std::int64_t incx, std::complex* y, std::int64_t incy, float c, float s, + const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::rot(selector.get_queue(), n, x, incx, y, incy, - c, s, dependencies); + c, s, dependencies); return done; } @@ -2078,7 +2078,7 @@ sycl::event rot(backend_selector selector, std::int64_t n, std::int64_t incy, double c, double s, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::rot(selector.get_queue(), n, x, incx, y, incy, - c, s, dependencies); + c, s, dependencies); return done; } @@ -2086,7 +2086,7 @@ sycl::event rot(backend_selector selector, std::int64_t n, flo std::int64_t incx, float* y, std::int64_t incy, float c, float s, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::rot(selector.get_queue(), n, x, incx, y, incy, - c, s, dependencies); + c, s, dependencies); return done; } @@ -2094,23 +2094,23 @@ sycl::event rot(backend_selector selector, std::int64_t n, dou std::int64_t incx, double* y, std::int64_t incy, double c, double s, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::rot(selector.get_queue(), n, x, incx, y, incy, - c, s, dependencies); + c, s, dependencies); return done; } sycl::event axpy(backend_selector selector, std::int64_t n, float alpha, const float* x, std::int64_t incx, float* y, std::int64_t incy, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::axpy(selector.get_queue(), n, alpha, x, incx, - y, incy, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::axpy(selector.get_queue(), n, alpha, x, incx, y, + incy, dependencies); return done; } sycl::event axpy(backend_selector selector, std::int64_t n, double alpha, const double* x, std::int64_t incx, double* y, std::int64_t incy, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::axpy(selector.get_queue(), n, alpha, x, incx, - y, incy, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::axpy(selector.get_queue(), n, alpha, x, incx, y, + incy, dependencies); return done; } @@ -2118,8 +2118,8 @@ sycl::event axpy(backend_selector selector, std::int64_t n, std::complex alpha, const std::complex* x, std::int64_t incx, std::complex* y, std::int64_t incy, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::axpy(selector.get_queue(), n, alpha, x, incx, - y, incy, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::axpy(selector.get_queue(), n, alpha, x, incx, y, + incy, dependencies); return done; } @@ -2127,8 +2127,8 @@ sycl::event axpy(backend_selector selector, std::int64_t n, std::complex alpha, const std::complex* x, std::int64_t incx, std::complex* y, std::int64_t incy, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::axpy(selector.get_queue(), n, alpha, x, incx, - y, incy, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::axpy(selector.get_queue(), n, alpha, x, incx, y, + incy, dependencies); return done; } @@ -2175,8 +2175,8 @@ sycl::event axpy_batch(backend_selector selector, std::int64_t std::int64_t incy, std::int64_t stridey, std::int64_t batch_size, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, - incx, stridex, y, incy, stridey, - batch_size, dependencies); + incx, stridex, y, incy, stridey, + batch_size, dependencies); return done; } @@ -2185,8 +2185,8 @@ sycl::event axpy_batch(backend_selector selector, std::int64_t std::int64_t incy, std::int64_t stridey, std::int64_t batch_size, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, - incx, stridex, y, incy, stridey, - batch_size, dependencies); + incx, stridex, y, incy, stridey, + batch_size, dependencies); return done; } @@ -2196,8 +2196,8 @@ sycl::event axpy_batch(backend_selector selector, std::int64_t std::int64_t stridey, std::int64_t batch_size, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, - incx, stridex, y, incy, stridey, - batch_size, dependencies); + incx, stridex, y, incy, stridey, + batch_size, dependencies); return done; } @@ -2207,8 +2207,8 @@ sycl::event axpy_batch(backend_selector selector, std::int64_t std::int64_t stridey, std::int64_t batch_size, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::axpy_batch(selector.get_queue(), n, alpha, x, - incx, stridex, y, incy, stridey, - batch_size, dependencies); + incx, stridex, y, incy, stridey, + batch_size, dependencies); return done; } @@ -2216,7 +2216,7 @@ sycl::event axpby(backend_selector selector, std::int64_t n, f const float* x, std::int64_t incx, const float beta, float* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::axpby(selector.get_queue(), n, alpha, x, incx, - beta, y, incy, dependencies); + beta, y, incy, dependencies); return done; } @@ -2224,7 +2224,7 @@ sycl::event axpby(backend_selector selector, std::int64_t n, d const double* x, std::int64_t incx, const double beta, double* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::axpby(selector.get_queue(), n, alpha, x, incx, - beta, y, incy, dependencies); + beta, y, incy, dependencies); return done; } @@ -2233,7 +2233,7 @@ sycl::event axpby(backend_selector selector, std::int64_t n, const std::complex beta, std::complex* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::axpby(selector.get_queue(), n, alpha, x, incx, - beta, y, incy, dependencies); + beta, y, incy, dependencies); return done; } @@ -2242,7 +2242,7 @@ sycl::event axpby(backend_selector selector, std::int64_t n, const std::complex beta, std::complex* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::axpby(selector.get_queue(), n, alpha, x, incx, - beta, y, incy, dependencies); + beta, y, incy, dependencies); return done; } @@ -2250,8 +2250,8 @@ sycl::event gerc(backend_selector selector, std::int64_t m, st std::complex alpha, const std::complex* x, std::int64_t incx, const std::complex* y, std::int64_t incy, std::complex* a, std::int64_t lda, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gerc(selector.get_queue(), m, n, alpha, x, - incx, y, incy, a, lda, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::gerc(selector.get_queue(), m, n, alpha, x, incx, + y, incy, a, lda, dependencies); return done; } @@ -2259,8 +2259,8 @@ sycl::event gerc(backend_selector selector, std::int64_t m, st std::complex alpha, const std::complex* x, std::int64_t incx, const std::complex* y, std::int64_t incy, std::complex* a, std::int64_t lda, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gerc(selector.get_queue(), m, n, alpha, x, - incx, y, incy, a, lda, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::gerc(selector.get_queue(), m, n, alpha, x, incx, + y, incy, a, lda, dependencies); return done; } @@ -2269,8 +2269,8 @@ sycl::event syr2k(backend_selector selector, uplo upper_lower, const float* b, std::int64_t ldb, float beta, float* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, - n, k, alpha, a, lda, b, ldb, beta, c, - ldc, dependencies); + n, k, alpha, a, lda, b, ldb, beta, c, ldc, + dependencies); return done; } @@ -2279,8 +2279,8 @@ sycl::event syr2k(backend_selector selector, uplo upper_lower, const double* b, std::int64_t ldb, double beta, double* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, - n, k, alpha, a, lda, b, ldb, beta, c, - ldc, dependencies); + n, k, alpha, a, lda, b, ldb, beta, c, ldc, + dependencies); return done; } @@ -2290,8 +2290,8 @@ sycl::event syr2k(backend_selector selector, uplo upper_lower, std::int64_t ldb, std::complex beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, - n, k, alpha, a, lda, b, ldb, beta, c, - ldc, dependencies); + n, k, alpha, a, lda, b, ldb, beta, c, ldc, + dependencies); return done; } @@ -2301,8 +2301,8 @@ sycl::event syr2k(backend_selector selector, uplo upper_lower, std::int64_t ldb, std::complex beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::syr2k(selector.get_queue(), upper_lower, trans, - n, k, alpha, a, lda, b, ldb, beta, c, - ldc, dependencies); + n, k, alpha, a, lda, b, ldb, beta, c, ldc, + dependencies); return done; } @@ -2344,9 +2344,9 @@ sycl::event gemv(backend_selector selector, transpose trans, s return done; } -sycl::event gemv_batch(backend_selector selector, transpose trans, - std::int64_t m, std::int64_t n, float alpha, const float* a, - std::int64_t lda, std::int64_t stridea, const float* x, std::int64_t incx, +sycl::event gemv_batch(backend_selector selector, transpose trans, std::int64_t m, + std::int64_t n, float alpha, const float* a, std::int64_t lda, + std::int64_t stridea, const float* x, std::int64_t incx, std::int64_t stridex, float beta, float* y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size, const std::vector& dependencies) { @@ -2356,9 +2356,9 @@ sycl::event gemv_batch(backend_selector selector, transpose tr return done; } -sycl::event gemv_batch(backend_selector selector, transpose trans, - std::int64_t m, std::int64_t n, double alpha, const double* a, - std::int64_t lda, std::int64_t stridea, const double* x, std::int64_t incx, +sycl::event gemv_batch(backend_selector selector, transpose trans, std::int64_t m, + std::int64_t n, double alpha, const double* a, std::int64_t lda, + std::int64_t stridea, const double* x, std::int64_t incx, std::int64_t stridex, double beta, double* y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size, const std::vector& dependencies) { @@ -2368,26 +2368,24 @@ sycl::event gemv_batch(backend_selector selector, transpose tr return done; } -sycl::event gemv_batch(backend_selector selector, transpose trans, - std::int64_t m, std::int64_t n, std::complex alpha, - const std::complex* a, std::int64_t lda, std::int64_t stridea, - const std::complex* x, std::int64_t incx, std::int64_t stridex, - std::complex beta, std::complex* y, std::int64_t incy, - std::int64_t stridey, std::int64_t batch_size, - const std::vector& dependencies) { +sycl::event gemv_batch(backend_selector selector, transpose trans, std::int64_t m, + std::int64_t n, std::complex alpha, const std::complex* a, + std::int64_t lda, std::int64_t stridea, const std::complex* x, + std::int64_t incx, std::int64_t stridex, std::complex beta, + std::complex* y, std::int64_t incy, std::int64_t stridey, + std::int64_t batch_size, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::gemv_batch( selector.get_queue(), trans, m, n, alpha, a, lda, stridea, x, incx, stridex, beta, y, incy, stridey, batch_size, dependencies); return done; } -sycl::event gemv_batch(backend_selector selector, transpose trans, - std::int64_t m, std::int64_t n, std::complex alpha, - const std::complex* a, std::int64_t lda, std::int64_t stridea, - const std::complex* x, std::int64_t incx, std::int64_t stridex, - std::complex beta, std::complex* y, std::int64_t incy, - std::int64_t stridey, std::int64_t batch_size, - const std::vector& dependencies) { +sycl::event gemv_batch(backend_selector selector, transpose trans, std::int64_t m, + std::int64_t n, std::complex alpha, const std::complex* a, + std::int64_t lda, std::int64_t stridea, const std::complex* x, + std::int64_t incx, std::int64_t stridex, std::complex beta, + std::complex* y, std::int64_t incy, std::int64_t stridey, + std::int64_t batch_size, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::gemv_batch( selector.get_queue(), trans, m, n, alpha, a, lda, stridea, x, incx, stridex, beta, y, incy, stridey, batch_size, dependencies); @@ -2441,33 +2439,33 @@ sycl::event gemv_batch(backend_selector selector, transpose* t return done; } -sycl::event dgmm_batch(backend_selector selector, side left_right, - std::int64_t m, std::int64_t n, const float* a, std::int64_t lda, - std::int64_t stridea, const float* x, std::int64_t incx, - std::int64_t stridex, float* c, std::int64_t ldc, std::int64_t stridec, - std::int64_t batch_size, const std::vector& dependencies) { +sycl::event dgmm_batch(backend_selector selector, side left_right, std::int64_t m, + std::int64_t n, const float* a, std::int64_t lda, std::int64_t stridea, + const float* x, std::int64_t incx, std::int64_t stridex, float* c, + std::int64_t ldc, std::int64_t stridec, std::int64_t batch_size, + const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dgmm_batch( selector.get_queue(), left_right, m, n, a, lda, stridea, x, incx, stridex, c, ldc, stridec, batch_size, dependencies); return done; } -sycl::event dgmm_batch(backend_selector selector, side left_right, - std::int64_t m, std::int64_t n, const double* a, std::int64_t lda, - std::int64_t stridea, const double* x, std::int64_t incx, - std::int64_t stridex, double* c, std::int64_t ldc, std::int64_t stridec, - std::int64_t batch_size, const std::vector& dependencies) { +sycl::event dgmm_batch(backend_selector selector, side left_right, std::int64_t m, + std::int64_t n, const double* a, std::int64_t lda, std::int64_t stridea, + const double* x, std::int64_t incx, std::int64_t stridex, double* c, + std::int64_t ldc, std::int64_t stridec, std::int64_t batch_size, + const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dgmm_batch( selector.get_queue(), left_right, m, n, a, lda, stridea, x, incx, stridex, c, ldc, stridec, batch_size, dependencies); return done; } -sycl::event dgmm_batch(backend_selector selector, side left_right, - std::int64_t m, std::int64_t n, const std::complex* a, - std::int64_t lda, std::int64_t stridea, const std::complex* x, - std::int64_t incx, std::int64_t stridex, std::complex* c, - std::int64_t ldc, std::int64_t stridec, std::int64_t batch_size, +sycl::event dgmm_batch(backend_selector selector, side left_right, std::int64_t m, + std::int64_t n, const std::complex* a, std::int64_t lda, + std::int64_t stridea, const std::complex* x, std::int64_t incx, + std::int64_t stridex, std::complex* c, std::int64_t ldc, + std::int64_t stridec, std::int64_t batch_size, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dgmm_batch( selector.get_queue(), left_right, m, n, a, lda, stridea, x, incx, stridex, c, ldc, stridec, @@ -2475,11 +2473,11 @@ sycl::event dgmm_batch(backend_selector selector, side left_ri return done; } -sycl::event dgmm_batch(backend_selector selector, side left_right, - std::int64_t m, std::int64_t n, const std::complex* a, - std::int64_t lda, std::int64_t stridea, const std::complex* x, - std::int64_t incx, std::int64_t stridex, std::complex* c, - std::int64_t ldc, std::int64_t stridec, std::int64_t batch_size, +sycl::event dgmm_batch(backend_selector selector, side left_right, std::int64_t m, + std::int64_t n, const std::complex* a, std::int64_t lda, + std::int64_t stridea, const std::complex* x, std::int64_t incx, + std::int64_t stridex, std::complex* c, std::int64_t ldc, + std::int64_t stridec, std::int64_t batch_size, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dgmm_batch( selector.get_queue(), left_right, m, n, a, lda, stridea, x, incx, stridex, c, ldc, stridec, @@ -2535,8 +2533,8 @@ sycl::event her(backend_selector selector, uplo upper_lower, s float alpha, const std::complex* x, std::int64_t incx, std::complex* a, std::int64_t lda, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::her(selector.get_queue(), upper_lower, n, - alpha, x, incx, a, lda, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::her(selector.get_queue(), upper_lower, n, alpha, + x, incx, a, lda, dependencies); return done; } @@ -2544,24 +2542,24 @@ sycl::event her(backend_selector selector, uplo upper_lower, s double alpha, const std::complex* x, std::int64_t incx, std::complex* a, std::int64_t lda, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::her(selector.get_queue(), upper_lower, n, - alpha, x, incx, a, lda, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::her(selector.get_queue(), upper_lower, n, alpha, + x, incx, a, lda, dependencies); return done; } sycl::event hpr(backend_selector selector, uplo upper_lower, std::int64_t n, float alpha, const std::complex* x, std::int64_t incx, std::complex* a, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::hpr(selector.get_queue(), upper_lower, n, - alpha, x, incx, a, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::hpr(selector.get_queue(), upper_lower, n, alpha, + x, incx, a, dependencies); return done; } sycl::event hpr(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, const std::complex* x, std::int64_t incx, std::complex* a, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::hpr(selector.get_queue(), upper_lower, n, - alpha, x, incx, a, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::hpr(selector.get_queue(), upper_lower, n, alpha, + x, incx, a, dependencies); return done; } @@ -2569,7 +2567,7 @@ sycl::event iamin(backend_selector selector, std::int64_t n, c std::int64_t incx, std::int64_t* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::iamin(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -2577,7 +2575,7 @@ sycl::event iamin(backend_selector selector, std::int64_t n, c std::int64_t incx, std::int64_t* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::iamin(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -2585,7 +2583,7 @@ sycl::event iamin(backend_selector selector, std::int64_t n, const std::complex* x, std::int64_t incx, std::int64_t* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::iamin(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -2593,7 +2591,7 @@ sycl::event iamin(backend_selector selector, std::int64_t n, const std::complex* x, std::int64_t incx, std::int64_t* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::iamin(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -2813,7 +2811,7 @@ sycl::event swap(backend_selector selector, std::int64_t n, fl std::int64_t incx, float* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::swap(selector.get_queue(), n, x, incx, y, incy, - dependencies); + dependencies); return done; } @@ -2821,7 +2819,7 @@ sycl::event swap(backend_selector selector, std::int64_t n, do std::int64_t incx, double* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::swap(selector.get_queue(), n, x, incx, y, incy, - dependencies); + dependencies); return done; } @@ -2829,7 +2827,7 @@ sycl::event swap(backend_selector selector, std::int64_t n, std::complex* x, std::int64_t incx, std::complex* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::swap(selector.get_queue(), n, x, incx, y, incy, - dependencies); + dependencies); return done; } @@ -2837,7 +2835,7 @@ sycl::event swap(backend_selector selector, std::int64_t n, std::complex* x, std::int64_t incx, std::complex* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::swap(selector.get_queue(), n, x, incx, y, incy, - dependencies); + dependencies); return done; } @@ -2845,8 +2843,8 @@ sycl::event geru(backend_selector selector, std::int64_t m, st std::complex alpha, const std::complex* x, std::int64_t incx, const std::complex* y, std::int64_t incy, std::complex* a, std::int64_t lda, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::geru(selector.get_queue(), m, n, alpha, x, - incx, y, incy, a, lda, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::geru(selector.get_queue(), m, n, alpha, x, incx, + y, incy, a, lda, dependencies); return done; } @@ -2854,8 +2852,8 @@ sycl::event geru(backend_selector selector, std::int64_t m, st std::complex alpha, const std::complex* x, std::int64_t incx, const std::complex* y, std::int64_t incy, std::complex* a, std::int64_t lda, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::geru(selector.get_queue(), m, n, alpha, x, - incx, y, incy, a, lda, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::geru(selector.get_queue(), m, n, alpha, x, incx, + y, incy, a, lda, dependencies); return done; } @@ -2863,7 +2861,7 @@ sycl::event nrm2(backend_selector selector, std::int64_t n, const std::complex* x, std::int64_t incx, float* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::nrm2(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -2871,21 +2869,21 @@ sycl::event nrm2(backend_selector selector, std::int64_t n, const std::complex* x, std::int64_t incx, double* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::nrm2(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } sycl::event nrm2(backend_selector selector, std::int64_t n, const float* x, std::int64_t incx, float* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::nrm2(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } sycl::event nrm2(backend_selector selector, std::int64_t n, const double* x, std::int64_t incx, double* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::nrm2(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -2893,9 +2891,9 @@ sycl::event gemm(backend_selector selector, transpose transa, std::int64_t m, std::int64_t n, std::int64_t k, float alpha, const float* a, std::int64_t lda, const float* b, std::int64_t ldb, float beta, float* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, - n, k, alpha, a, lda, b, ldb, beta, c, ldc, - dependencies); + auto done = + oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, + alpha, a, lda, b, ldb, beta, c, ldc, dependencies); return done; } @@ -2903,9 +2901,9 @@ sycl::event gemm(backend_selector selector, transpose transa, std::int64_t m, std::int64_t n, std::int64_t k, double alpha, const double* a, std::int64_t lda, const double* b, std::int64_t ldb, double beta, double* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, - n, k, alpha, a, lda, b, ldb, beta, c, ldc, - dependencies); + auto done = + oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, + alpha, a, lda, b, ldb, beta, c, ldc, dependencies); return done; } @@ -2914,9 +2912,9 @@ sycl::event gemm(backend_selector selector, transpose transa, const std::complex* a, std::int64_t lda, const std::complex* b, std::int64_t ldb, std::complex beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, - n, k, alpha, a, lda, b, ldb, beta, c, ldc, - dependencies); + auto done = + oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, + alpha, a, lda, b, ldb, beta, c, ldc, dependencies); return done; } @@ -2925,9 +2923,9 @@ sycl::event gemm(backend_selector selector, transpose transa, const std::complex* a, std::int64_t lda, const std::complex* b, std::int64_t ldb, std::complex beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, - n, k, alpha, a, lda, b, ldb, beta, c, ldc, - dependencies); + auto done = + oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, + alpha, a, lda, b, ldb, beta, c, ldc, dependencies); return done; } @@ -2936,9 +2934,9 @@ sycl::event gemm(backend_selector selector, transpose transa, const sycl::half* a, std::int64_t lda, const sycl::half* b, std::int64_t ldb, sycl::half beta, sycl::half* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, - n, k, alpha, a, lda, b, ldb, beta, c, ldc, - dependencies); + auto done = + oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, + alpha, a, lda, b, ldb, beta, c, ldc, dependencies); return done; } @@ -2946,9 +2944,9 @@ sycl::event gemm(backend_selector selector, transpose transa, std::int64_t m, std::int64_t n, std::int64_t k, float alpha, const sycl::half* a, std::int64_t lda, const sycl::half* b, std::int64_t ldb, float beta, float* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, - n, k, alpha, a, lda, b, ldb, beta, c, ldc, - dependencies); + auto done = + oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, + alpha, a, lda, b, ldb, beta, c, ldc, dependencies); return done; } @@ -2956,9 +2954,9 @@ sycl::event gemm(backend_selector selector, transpose transa, std::int64_t m, std::int64_t n, std::int64_t k, float alpha, const bfloat16* a, std::int64_t lda, const bfloat16* b, std::int64_t ldb, float beta, float* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, - n, k, alpha, a, lda, b, ldb, beta, c, ldc, - dependencies); + auto done = + oneapi::math::blas::generic::MAJOR::gemm(selector.get_queue(), transa, transb, m, n, k, + alpha, a, lda, b, ldb, beta, c, ldc, dependencies); return done; } @@ -3032,7 +3030,7 @@ sycl::event ger(backend_selector selector, std::int64_t m, std float alpha, const float* x, std::int64_t incx, const float* y, std::int64_t incy, float* a, std::int64_t lda, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::ger(selector.get_queue(), m, n, alpha, x, incx, - y, incy, a, lda, dependencies); + y, incy, a, lda, dependencies); return done; } @@ -3041,7 +3039,7 @@ sycl::event ger(backend_selector selector, std::int64_t m, std std::int64_t incy, double* a, std::int64_t lda, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::ger(selector.get_queue(), m, n, alpha, x, incx, - y, incy, a, lda, dependencies); + y, incy, a, lda, dependencies); return done; } @@ -3050,8 +3048,8 @@ sycl::event trsm(backend_selector selector, side left_right, u const float* a, std::int64_t lda, float* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::trsm(selector.get_queue(), left_right, - upper_lower, trans, unit_diag, m, n, - alpha, a, lda, b, ldb, dependencies); + upper_lower, trans, unit_diag, m, n, alpha, + a, lda, b, ldb, dependencies); return done; } @@ -3060,8 +3058,8 @@ sycl::event trsm(backend_selector selector, side left_right, u const double* a, std::int64_t lda, double* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::trsm(selector.get_queue(), left_right, - upper_lower, trans, unit_diag, m, n, - alpha, a, lda, b, ldb, dependencies); + upper_lower, trans, unit_diag, m, n, alpha, + a, lda, b, ldb, dependencies); return done; } @@ -3071,8 +3069,8 @@ sycl::event trsm(backend_selector selector, side left_right, u std::complex* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::trsm(selector.get_queue(), left_right, - upper_lower, trans, unit_diag, m, n, - alpha, a, lda, b, ldb, dependencies); + upper_lower, trans, unit_diag, m, n, alpha, + a, lda, b, ldb, dependencies); return done; } @@ -3082,8 +3080,8 @@ sycl::event trsm(backend_selector selector, side left_right, u std::complex* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::trsm(selector.get_queue(), left_right, - upper_lower, trans, unit_diag, m, n, - alpha, a, lda, b, ldb, dependencies); + upper_lower, trans, unit_diag, m, n, alpha, + a, lda, b, ldb, dependencies); return done; } @@ -3184,7 +3182,7 @@ sycl::event dotu(backend_selector selector, std::int64_t n, std::int64_t incy, std::complex* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dotu(selector.get_queue(), n, x, incx, y, incy, - result, dependencies); + result, dependencies); return done; } @@ -3193,7 +3191,7 @@ sycl::event dotu(backend_selector selector, std::int64_t n, std::int64_t incy, std::complex* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dotu(selector.get_queue(), n, x, incx, y, incy, - result, dependencies); + result, dependencies); return done; } @@ -3203,8 +3201,8 @@ sycl::event hemm(backend_selector selector, side left_right, u std::int64_t ldb, std::complex beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::hemm(selector.get_queue(), left_right, - upper_lower, m, n, alpha, a, lda, b, ldb, - beta, c, ldc, dependencies); + upper_lower, m, n, alpha, a, lda, b, ldb, + beta, c, ldc, dependencies); return done; } @@ -3214,8 +3212,8 @@ sycl::event hemm(backend_selector selector, side left_right, u std::int64_t ldb, std::complex beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::hemm(selector.get_queue(), left_right, - upper_lower, m, n, alpha, a, lda, b, ldb, - beta, c, ldc, dependencies); + upper_lower, m, n, alpha, a, lda, b, ldb, + beta, c, ldc, dependencies); return done; } @@ -3224,7 +3222,7 @@ sycl::event hpr2(backend_selector selector, uplo upper_lower, const std::complex* y, std::int64_t incy, std::complex* a, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::hpr2(selector.get_queue(), upper_lower, n, - alpha, x, incx, y, incy, a, dependencies); + alpha, x, incx, y, incy, a, dependencies); return done; } @@ -3233,7 +3231,7 @@ sycl::event hpr2(backend_selector selector, uplo upper_lower, const std::complex* y, std::int64_t incy, std::complex* a, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::hpr2(selector.get_queue(), upper_lower, n, - alpha, x, incx, y, incy, a, dependencies); + alpha, x, incx, y, incy, a, dependencies); return done; } @@ -3243,7 +3241,7 @@ sycl::event gbmv(backend_selector selector, transpose trans, s std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::gbmv(selector.get_queue(), trans, m, n, kl, ku, alpha, - a, lda, x, incx, beta, y, incy, dependencies); + a, lda, x, incx, beta, y, incy, dependencies); return done; } @@ -3253,7 +3251,7 @@ sycl::event gbmv(backend_selector selector, transpose trans, s std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::gbmv(selector.get_queue(), trans, m, n, kl, ku, alpha, - a, lda, x, incx, beta, y, incy, dependencies); + a, lda, x, incx, beta, y, incy, dependencies); return done; } @@ -3264,7 +3262,7 @@ sycl::event gbmv(backend_selector selector, transpose trans, s std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::gbmv(selector.get_queue(), trans, m, n, kl, ku, alpha, - a, lda, x, incx, beta, y, incy, dependencies); + a, lda, x, incx, beta, y, incy, dependencies); return done; } @@ -3275,7 +3273,7 @@ sycl::event gbmv(backend_selector selector, transpose trans, s std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::gbmv(selector.get_queue(), trans, m, n, kl, ku, alpha, - a, lda, x, incx, beta, y, incy, dependencies); + a, lda, x, incx, beta, y, incy, dependencies); return done; } @@ -3318,8 +3316,8 @@ sycl::event symm(backend_selector selector, side left_right, u const float* b, std::int64_t ldb, float beta, float* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::symm(selector.get_queue(), left_right, - upper_lower, m, n, alpha, a, lda, b, ldb, - beta, c, ldc, dependencies); + upper_lower, m, n, alpha, a, lda, b, ldb, + beta, c, ldc, dependencies); return done; } @@ -3328,8 +3326,8 @@ sycl::event symm(backend_selector selector, side left_right, u const double* b, std::int64_t ldb, double beta, double* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::symm(selector.get_queue(), left_right, - upper_lower, m, n, alpha, a, lda, b, ldb, - beta, c, ldc, dependencies); + upper_lower, m, n, alpha, a, lda, b, ldb, + beta, c, ldc, dependencies); return done; } @@ -3339,8 +3337,8 @@ sycl::event symm(backend_selector selector, side left_right, u std::int64_t ldb, std::complex beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::symm(selector.get_queue(), left_right, - upper_lower, m, n, alpha, a, lda, b, ldb, - beta, c, ldc, dependencies); + upper_lower, m, n, alpha, a, lda, b, ldb, + beta, c, ldc, dependencies); return done; } @@ -3350,8 +3348,8 @@ sycl::event symm(backend_selector selector, side left_right, u std::int64_t ldb, std::complex beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::symm(selector.get_queue(), left_right, - upper_lower, m, n, alpha, a, lda, b, ldb, - beta, c, ldc, dependencies); + upper_lower, m, n, alpha, a, lda, b, ldb, + beta, c, ldc, dependencies); return done; } @@ -3360,7 +3358,7 @@ sycl::event dotc(backend_selector selector, std::int64_t n, std::int64_t incy, std::complex* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dotc(selector.get_queue(), n, x, incx, y, incy, - result, dependencies); + result, dependencies); return done; } @@ -3369,23 +3367,23 @@ sycl::event dotc(backend_selector selector, std::int64_t n, std::int64_t incy, std::complex* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dotc(selector.get_queue(), n, x, incx, y, incy, - result, dependencies); + result, dependencies); return done; } sycl::event syr(backend_selector selector, uplo upper_lower, std::int64_t n, float alpha, const float* x, std::int64_t incx, float* a, std::int64_t lda, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::syr(selector.get_queue(), upper_lower, n, - alpha, x, incx, a, lda, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::syr(selector.get_queue(), upper_lower, n, alpha, + x, incx, a, lda, dependencies); return done; } sycl::event syr(backend_selector selector, uplo upper_lower, std::int64_t n, double alpha, const double* x, std::int64_t incx, double* a, std::int64_t lda, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::syr(selector.get_queue(), upper_lower, n, - alpha, x, incx, a, lda, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::syr(selector.get_queue(), upper_lower, n, alpha, + x, incx, a, lda, dependencies); return done; } @@ -3394,8 +3392,8 @@ sycl::event trmm(backend_selector selector, side left_right, u const float* a, std::int64_t lda, float* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::trmm(selector.get_queue(), left_right, - upper_lower, trans, unit_diag, m, n, - alpha, a, lda, b, ldb, dependencies); + upper_lower, trans, unit_diag, m, n, alpha, + a, lda, b, ldb, dependencies); return done; } @@ -3404,8 +3402,8 @@ sycl::event trmm(backend_selector selector, side left_right, u const double* a, std::int64_t lda, double* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::trmm(selector.get_queue(), left_right, - upper_lower, trans, unit_diag, m, n, - alpha, a, lda, b, ldb, dependencies); + upper_lower, trans, unit_diag, m, n, alpha, + a, lda, b, ldb, dependencies); return done; } @@ -3415,8 +3413,8 @@ sycl::event trmm(backend_selector selector, side left_right, u std::complex* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::trmm(selector.get_queue(), left_right, - upper_lower, trans, unit_diag, m, n, - alpha, a, lda, b, ldb, dependencies); + upper_lower, trans, unit_diag, m, n, alpha, + a, lda, b, ldb, dependencies); return done; } @@ -3426,22 +3424,22 @@ sycl::event trmm(backend_selector selector, side left_right, u std::complex* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::trmm(selector.get_queue(), left_right, - upper_lower, trans, unit_diag, m, n, - alpha, a, lda, b, ldb, dependencies); + upper_lower, trans, unit_diag, m, n, alpha, + a, lda, b, ldb, dependencies); return done; } sycl::event rotmg(backend_selector selector, float* d1, float* d2, float* x1, float y1, float* param, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::rotmg(selector.get_queue(), d1, d2, x1, y1, - param, dependencies); + param, dependencies); return done; } sycl::event rotmg(backend_selector selector, double* d1, double* d2, double* x1, double y1, double* param, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::rotmg(selector.get_queue(), d1, d2, x1, y1, - param, dependencies); + param, dependencies); return done; } @@ -3449,7 +3447,7 @@ sycl::event tpsv(backend_selector selector, uplo upper_lower, diag unit_diag, std::int64_t n, const float* a, float* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, - unit_diag, n, a, x, incx, dependencies); + unit_diag, n, a, x, incx, dependencies); return done; } @@ -3457,7 +3455,7 @@ sycl::event tpsv(backend_selector selector, uplo upper_lower, diag unit_diag, std::int64_t n, const double* a, double* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, - unit_diag, n, a, x, incx, dependencies); + unit_diag, n, a, x, incx, dependencies); return done; } @@ -3466,7 +3464,7 @@ sycl::event tpsv(backend_selector selector, uplo upper_lower, std::complex* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, - unit_diag, n, a, x, incx, dependencies); + unit_diag, n, a, x, incx, dependencies); return done; } @@ -3475,7 +3473,7 @@ sycl::event tpsv(backend_selector selector, uplo upper_lower, std::complex* x, std::int64_t incx, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::tpsv(selector.get_queue(), upper_lower, trans, - unit_diag, n, a, x, incx, dependencies); + unit_diag, n, a, x, incx, dependencies); return done; } @@ -3517,7 +3515,7 @@ sycl::event copy(backend_selector selector, std::int64_t n, co std::int64_t incx, float* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::copy(selector.get_queue(), n, x, incx, y, incy, - dependencies); + dependencies); return done; } @@ -3525,7 +3523,7 @@ sycl::event copy(backend_selector selector, std::int64_t n, co std::int64_t incx, double* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::copy(selector.get_queue(), n, x, incx, y, incy, - dependencies); + dependencies); return done; } @@ -3533,7 +3531,7 @@ sycl::event copy(backend_selector selector, std::int64_t n, const std::complex* x, std::int64_t incx, std::complex* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::copy(selector.get_queue(), n, x, incx, y, incy, - dependencies); + dependencies); return done; } @@ -3541,7 +3539,7 @@ sycl::event copy(backend_selector selector, std::int64_t n, const std::complex* x, std::int64_t incx, std::complex* y, std::int64_t incy, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::copy(selector.get_queue(), n, x, incx, y, incy, - dependencies); + dependencies); return done; } @@ -3590,9 +3588,9 @@ sycl::event copy_batch(backend_selector selector, std::int64_t return done; } -sycl::event copy_batch(backend_selector selector, std::int64_t n, - const double* x, std::int64_t incx, std::int64_t stridex, double* y, - std::int64_t incy, std::int64_t stridey, std::int64_t batch_size, +sycl::event copy_batch(backend_selector selector, std::int64_t n, const double* x, + std::int64_t incx, std::int64_t stridex, double* y, std::int64_t incy, + std::int64_t stridey, std::int64_t batch_size, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::copy_batch( selector.get_queue(), n, x, incx, stridex, y, incy, stridey, batch_size, dependencies); @@ -3641,9 +3639,9 @@ sycl::event gemmt(backend_selector selector, uplo upper_lower, transpose transb, std::int64_t n, std::int64_t k, float alpha, const float* a, std::int64_t lda, const float* b, std::int64_t ldb, float beta, float* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, - transa, transb, n, k, alpha, a, lda, b, - ldb, beta, c, ldc, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, transa, + transb, n, k, alpha, a, lda, b, ldb, beta, + c, ldc, dependencies); return done; } @@ -3651,9 +3649,9 @@ sycl::event gemmt(backend_selector selector, uplo upper_lower, transpose transb, std::int64_t n, std::int64_t k, double alpha, const double* a, std::int64_t lda, const double* b, std::int64_t ldb, double beta, double* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, - transa, transb, n, k, alpha, a, lda, b, - ldb, beta, c, ldc, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, transa, + transb, n, k, alpha, a, lda, b, ldb, beta, + c, ldc, dependencies); return done; } @@ -3662,9 +3660,9 @@ sycl::event gemmt(backend_selector selector, uplo upper_lower, const std::complex* a, std::int64_t lda, const std::complex* b, std::int64_t ldb, std::complex beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, - transa, transb, n, k, alpha, a, lda, b, - ldb, beta, c, ldc, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, transa, + transb, n, k, alpha, a, lda, b, ldb, beta, + c, ldc, dependencies); return done; } @@ -3673,9 +3671,9 @@ sycl::event gemmt(backend_selector selector, uplo upper_lower, const std::complex* a, std::int64_t lda, const std::complex* b, std::int64_t ldb, std::complex beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, - transa, transb, n, k, alpha, a, lda, b, - ldb, beta, c, ldc, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::gemmt(selector.get_queue(), upper_lower, transa, + transb, n, k, alpha, a, lda, b, ldb, beta, + c, ldc, dependencies); return done; } @@ -3685,7 +3683,7 @@ sycl::event sbmv(backend_selector selector, uplo upper_lower, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::sbmv(selector.get_queue(), upper_lower, n, k, alpha, a, - lda, x, incx, beta, y, incy, dependencies); + lda, x, incx, beta, y, incy, dependencies); return done; } @@ -3695,7 +3693,7 @@ sycl::event sbmv(backend_selector selector, uplo upper_lower, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::sbmv(selector.get_queue(), upper_lower, n, k, alpha, a, - lda, x, incx, beta, y, incy, dependencies); + lda, x, incx, beta, y, incy, dependencies); return done; } @@ -3703,7 +3701,7 @@ sycl::event asum(backend_selector selector, std::int64_t n, const std::complex* x, std::int64_t incx, float* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::asum(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -3711,21 +3709,21 @@ sycl::event asum(backend_selector selector, std::int64_t n, const std::complex* x, std::int64_t incx, double* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::asum(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } sycl::event asum(backend_selector selector, std::int64_t n, const float* x, std::int64_t incx, float* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::asum(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } sycl::event asum(backend_selector selector, std::int64_t n, const double* x, std::int64_t incx, double* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::asum(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -3767,7 +3765,7 @@ sycl::event spr2(backend_selector selector, uplo upper_lower, float alpha, const float* x, std::int64_t incx, const float* y, std::int64_t incy, float* a, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::spr2(selector.get_queue(), upper_lower, n, - alpha, x, incx, y, incy, a, dependencies); + alpha, x, incx, y, incy, a, dependencies); return done; } @@ -3775,7 +3773,7 @@ sycl::event spr2(backend_selector selector, uplo upper_lower, double alpha, const double* x, std::int64_t incx, const double* y, std::int64_t incy, double* a, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::spr2(selector.get_queue(), upper_lower, n, - alpha, x, incx, y, incy, a, dependencies); + alpha, x, incx, y, incy, a, dependencies); return done; } @@ -3783,7 +3781,7 @@ sycl::event iamax(backend_selector selector, std::int64_t n, c std::int64_t incx, std::int64_t* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::iamax(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -3791,7 +3789,7 @@ sycl::event iamax(backend_selector selector, std::int64_t n, c std::int64_t incx, std::int64_t* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::iamax(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -3799,7 +3797,7 @@ sycl::event iamax(backend_selector selector, std::int64_t n, const std::complex* x, std::int64_t incx, std::int64_t* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::iamax(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -3807,7 +3805,7 @@ sycl::event iamax(backend_selector selector, std::int64_t n, const std::complex* x, std::int64_t incx, std::int64_t* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::iamax(selector.get_queue(), n, x, incx, result, - dependencies); + dependencies); return done; } @@ -3815,7 +3813,7 @@ sycl::event rotm(backend_selector selector, std::int64_t n, fl std::int64_t incx, float* y, std::int64_t incy, float* param, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::rotm(selector.get_queue(), n, x, incx, y, incy, - param, dependencies); + param, dependencies); return done; } @@ -3823,7 +3821,7 @@ sycl::event rotm(backend_selector selector, std::int64_t n, do std::int64_t incx, double* y, std::int64_t incy, double* param, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::rotm(selector.get_queue(), n, x, incx, y, incy, - param, dependencies); + param, dependencies); return done; } @@ -3861,7 +3859,7 @@ sycl::event sdsdot(backend_selector selector, std::int64_t n, const float* x, std::int64_t incx, const float* y, std::int64_t incy, float* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::sdsdot(selector.get_queue(), n, sb, x, incx, y, - incy, result, dependencies); + incy, result, dependencies); return done; } @@ -3871,8 +3869,8 @@ sycl::event her2k(backend_selector selector, uplo upper_lower, std::int64_t ldb, float beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::her2k(selector.get_queue(), upper_lower, trans, - n, k, alpha, a, lda, b, ldb, beta, c, - ldc, dependencies); + n, k, alpha, a, lda, b, ldb, beta, c, ldc, + dependencies); return done; } @@ -3882,8 +3880,8 @@ sycl::event her2k(backend_selector selector, uplo upper_lower, std::int64_t ldb, double beta, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::her2k(selector.get_queue(), upper_lower, trans, - n, k, alpha, a, lda, b, ldb, beta, c, - ldc, dependencies); + n, k, alpha, a, lda, b, ldb, beta, c, ldc, + dependencies); return done; } @@ -3891,7 +3889,7 @@ sycl::event dot(backend_selector selector, std::int64_t n, con std::int64_t incx, const float* y, std::int64_t incy, float* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dot(selector.get_queue(), n, x, incx, y, incy, - result, dependencies); + result, dependencies); return done; } @@ -3899,7 +3897,7 @@ sycl::event dot(backend_selector selector, std::int64_t n, con std::int64_t incx, const double* y, std::int64_t incy, double* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dot(selector.get_queue(), n, x, incx, y, incy, - result, dependencies); + result, dependencies); return done; } @@ -3907,7 +3905,7 @@ sycl::event dot(backend_selector selector, std::int64_t n, con std::int64_t incx, const float* y, std::int64_t incy, double* result, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::dot(selector.get_queue(), n, x, incx, y, incy, - result, dependencies); + result, dependencies); return done; } @@ -4065,7 +4063,7 @@ sycl::event omatcopy(backend_selector selector, transpose tran std::int64_t n, float alpha, const float* a, std::int64_t lda, float* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::omatcopy(selector.get_queue(), trans, m, n, - alpha, a, lda, b, ldb, dependencies); + alpha, a, lda, b, ldb, dependencies); return done; } @@ -4073,7 +4071,7 @@ sycl::event omatcopy(backend_selector selector, transpose tran std::int64_t n, double alpha, const double* a, std::int64_t lda, double* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::omatcopy(selector.get_queue(), trans, m, n, - alpha, a, lda, b, ldb, dependencies); + alpha, a, lda, b, ldb, dependencies); return done; } @@ -4082,7 +4080,7 @@ sycl::event omatcopy(backend_selector selector, transpose tran std::int64_t lda, std::complex* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::omatcopy(selector.get_queue(), trans, m, n, - alpha, a, lda, b, ldb, dependencies); + alpha, a, lda, b, ldb, dependencies); return done; } @@ -4091,7 +4089,7 @@ sycl::event omatcopy(backend_selector selector, transpose tran std::int64_t lda, std::complex* b, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::omatcopy(selector.get_queue(), trans, m, n, - alpha, a, lda, b, ldb, dependencies); + alpha, a, lda, b, ldb, dependencies); return done; } @@ -4137,7 +4135,7 @@ sycl::event imatcopy(backend_selector selector, transpose tran std::int64_t n, float alpha, float* ab, std::int64_t lda, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::imatcopy(selector.get_queue(), trans, m, n, - alpha, ab, lda, ldb, dependencies); + alpha, ab, lda, ldb, dependencies); return done; } @@ -4145,7 +4143,7 @@ sycl::event imatcopy(backend_selector selector, transpose tran std::int64_t n, double alpha, double* ab, std::int64_t lda, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::imatcopy(selector.get_queue(), trans, m, n, - alpha, ab, lda, ldb, dependencies); + alpha, ab, lda, ldb, dependencies); return done; } @@ -4154,7 +4152,7 @@ sycl::event imatcopy(backend_selector selector, transpose tran std::int64_t lda, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::imatcopy(selector.get_queue(), trans, m, n, - alpha, ab, lda, ldb, dependencies); + alpha, ab, lda, ldb, dependencies); return done; } @@ -4163,49 +4161,49 @@ sycl::event imatcopy(backend_selector selector, transpose tran std::int64_t lda, std::int64_t ldb, const std::vector& dependencies) { auto done = oneapi::math::blas::generic::MAJOR::imatcopy(selector.get_queue(), trans, m, n, - alpha, ab, lda, ldb, dependencies); + alpha, ab, lda, ldb, dependencies); return done; } -sycl::event omatadd(backend_selector selector, transpose transa, - transpose transb, std::int64_t m, std::int64_t n, float alpha, const float* a, - std::int64_t lda, float beta, const float* b, std::int64_t ldb, float* c, - std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, - m, n, alpha, a, lda, beta, b, ldb, c, - ldc, dependencies); +sycl::event omatadd(backend_selector selector, transpose transa, transpose transb, + std::int64_t m, std::int64_t n, float alpha, const float* a, std::int64_t lda, + float beta, const float* b, std::int64_t ldb, float* c, std::int64_t ldc, + const std::vector& dependencies) { + auto done = oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, m, + n, alpha, a, lda, beta, b, ldb, c, ldc, + dependencies); return done; } -sycl::event omatadd(backend_selector selector, transpose transa, - transpose transb, std::int64_t m, std::int64_t n, double alpha, const double* a, - std::int64_t lda, double beta, const double* b, std::int64_t ldb, double* c, - std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, - m, n, alpha, a, lda, beta, b, ldb, c, - ldc, dependencies); +sycl::event omatadd(backend_selector selector, transpose transa, transpose transb, + std::int64_t m, std::int64_t n, double alpha, const double* a, std::int64_t lda, + double beta, const double* b, std::int64_t ldb, double* c, std::int64_t ldc, + const std::vector& dependencies) { + auto done = oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, m, + n, alpha, a, lda, beta, b, ldb, c, ldc, + dependencies); return done; } -sycl::event omatadd(backend_selector selector, transpose transa, - transpose transb, std::int64_t m, std::int64_t n, std::complex alpha, +sycl::event omatadd(backend_selector selector, transpose transa, transpose transb, + std::int64_t m, std::int64_t n, std::complex alpha, const std::complex* a, std::int64_t lda, std::complex beta, const std::complex* b, std::int64_t ldb, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, - m, n, alpha, a, lda, beta, b, ldb, c, - ldc, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, m, + n, alpha, a, lda, beta, b, ldb, c, ldc, + dependencies); return done; } -sycl::event omatadd(backend_selector selector, transpose transa, - transpose transb, std::int64_t m, std::int64_t n, std::complex alpha, +sycl::event omatadd(backend_selector selector, transpose transa, transpose transb, + std::int64_t m, std::int64_t n, std::complex alpha, const std::complex* a, std::int64_t lda, std::complex beta, const std::complex* b, std::int64_t ldb, std::complex* c, std::int64_t ldc, const std::vector& dependencies) { - auto done = oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, - m, n, alpha, a, lda, beta, b, ldb, c, - ldc, dependencies); + auto done = oneapi::math::blas::generic::MAJOR::omatadd(selector.get_queue(), transa, transb, m, + n, alpha, a, lda, beta, b, ldb, c, ldc, + dependencies); return done; } diff --git a/src/blas/backends/generic/generic_batch.cxx b/src/blas/backends/generic/generic_batch.cxx index b0b900829..7a6af6070 100644 --- a/src/blas/backends/generic/generic_batch.cxx +++ b/src/blas/backends/generic/generic_batch.cxx @@ -119,14 +119,14 @@ void axpy_batch(sycl::queue& queue, std::int64_t n, float alpha, sycl::buffer& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { CALL_GENERIC_BLAS_FN(::blas::_axpy_batch, queue, n, alpha, x, incx, stridex, y, incy, stridey, - batch_size); + batch_size); } void axpy_batch(sycl::queue& queue, std::int64_t n, double alpha, sycl::buffer& x, std::int64_t incx, std::int64_t stridex, sycl::buffer& y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size) { CALL_GENERIC_BLAS_FN(::blas::_axpy_batch, queue, n, alpha, x, incx, stridex, y, incy, stridey, - batch_size); + batch_size); } void axpy_batch(sycl::queue& queue, std::int64_t n, std::complex alpha, @@ -172,8 +172,8 @@ void gemm_batch(sycl::queue& queue, oneapi::math::transpose transa, oneapi::math sycl::buffer& b, std::int64_t ldb, std::int64_t stride_b, float beta, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { - CALL_GENERIC_BLAS_FN(::blas::_gemm_strided_batched, queue, transa, transb, m, n, k, alpha, a, lda, - stride_a, b, ldb, stride_b, beta, c, ldc, stride_c, batch_size); + CALL_GENERIC_BLAS_FN(::blas::_gemm_strided_batched, queue, transa, transb, m, n, k, alpha, a, + lda, stride_a, b, ldb, stride_b, beta, c, ldc, stride_c, batch_size); } void gemm_batch(sycl::queue& queue, oneapi::math::transpose transa, oneapi::math::transpose transb, @@ -182,8 +182,8 @@ void gemm_batch(sycl::queue& queue, oneapi::math::transpose transa, oneapi::math sycl::buffer& b, std::int64_t ldb, std::int64_t stride_b, double beta, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { - CALL_GENERIC_BLAS_FN(::blas::_gemm_strided_batched, queue, transa, transb, m, n, k, alpha, a, lda, - stride_a, b, ldb, stride_b, beta, c, ldc, stride_c, batch_size); + CALL_GENERIC_BLAS_FN(::blas::_gemm_strided_batched, queue, transa, transb, m, n, k, alpha, a, + lda, stride_a, b, ldb, stride_b, beta, c, ldc, stride_c, batch_size); } void gemm_batch(sycl::queue& queue, oneapi::math::transpose transa, oneapi::math::transpose transb, @@ -277,16 +277,16 @@ void omatcopy_batch(sycl::queue& queue, oneapi::math::transpose trans, std::int6 std::int64_t n, float alpha, sycl::buffer& a, std::int64_t lda, std::int64_t stride_a, sycl::buffer& b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size) { - CALL_GENERIC_BLAS_FN(::blas::_omatcopy_batch, queue, trans, m, n, alpha, a, lda, stride_a, b, ldb, - stride_b, batch_size); + CALL_GENERIC_BLAS_FN(::blas::_omatcopy_batch, queue, trans, m, n, alpha, a, lda, stride_a, b, + ldb, stride_b, batch_size); } void omatcopy_batch(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t m, std::int64_t n, double alpha, sycl::buffer& a, std::int64_t lda, std::int64_t stride_a, sycl::buffer& b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size) { - CALL_GENERIC_BLAS_FN(::blas::_omatcopy_batch, queue, trans, m, n, alpha, a, lda, stride_a, b, ldb, - stride_b, batch_size); + CALL_GENERIC_BLAS_FN(::blas::_omatcopy_batch, queue, trans, m, n, alpha, a, lda, stride_a, b, + ldb, stride_b, batch_size); } void omatcopy_batch(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t m, @@ -337,8 +337,8 @@ void omatadd_batch(sycl::queue& queue, oneapi::math::transpose transa, sycl::buffer& b, std::int64_t ldb, std::int64_t stride_b, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { - CALL_GENERIC_BLAS_FN(::blas::_omatadd_batch, queue, transa, transb, m, n, alpha, a, lda, stride_a, - beta, b, ldb, stride_b, c, ldc, stride_c, batch_size); + CALL_GENERIC_BLAS_FN(::blas::_omatadd_batch, queue, transa, transb, m, n, alpha, a, lda, + stride_a, beta, b, ldb, stride_b, c, ldc, stride_c, batch_size); } void omatadd_batch(sycl::queue& queue, oneapi::math::transpose transa, @@ -347,8 +347,8 @@ void omatadd_batch(sycl::queue& queue, oneapi::math::transpose transa, sycl::buffer& b, std::int64_t ldb, std::int64_t stride_b, sycl::buffer& c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size) { - CALL_GENERIC_BLAS_FN(::blas::_omatadd_batch, queue, transa, transb, m, n, alpha, a, lda, stride_a, - beta, b, ldb, stride_b, c, ldc, stride_c, batch_size); + CALL_GENERIC_BLAS_FN(::blas::_omatadd_batch, queue, transa, transb, m, n, alpha, a, lda, + stride_a, beta, b, ldb, stride_b, c, ldc, stride_c, batch_size); } void omatadd_batch(sycl::queue& queue, oneapi::math::transpose transa, @@ -605,16 +605,16 @@ sycl::event axpy_batch(sycl::queue& queue, std::int64_t n, float alpha, const fl std::int64_t incx, std::int64_t stridex, float* y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_axpy_batch, queue, n, alpha, x, incx, stridex, y, incy, stridey, - batch_size, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_axpy_batch, queue, n, alpha, x, incx, stridex, y, incy, + stridey, batch_size, dependencies); } sycl::event axpy_batch(sycl::queue& queue, std::int64_t n, double alpha, const double* x, std::int64_t incx, std::int64_t stridex, double* y, std::int64_t incy, std::int64_t stridey, std::int64_t batch_size, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_axpy_batch, queue, n, alpha, x, incx, stridex, y, incy, stridey, - batch_size, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_axpy_batch, queue, n, alpha, x, incx, stridex, y, incy, + stridey, batch_size, dependencies); } sycl::event axpy_batch(sycl::queue& queue, std::int64_t n, std::complex alpha, @@ -764,9 +764,9 @@ sycl::event gemm_batch(sycl::queue& queue, oneapi::math::transpose transa, std::int64_t stride_b, float beta, float* c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_gemm_strided_batched, queue, transa, transb, m, n, k, alpha, a, - lda, stride_a, b, ldb, stride_b, beta, c, ldc, stride_c, batch_size, - dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_gemm_strided_batched, queue, transa, transb, m, n, k, alpha, + a, lda, stride_a, b, ldb, stride_b, beta, c, ldc, stride_c, batch_size, + dependencies); } sycl::event gemm_batch(sycl::queue& queue, oneapi::math::transpose transa, @@ -776,9 +776,9 @@ sycl::event gemm_batch(sycl::queue& queue, oneapi::math::transpose transa, std::int64_t stride_b, double beta, double* c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_gemm_strided_batched, queue, transa, transb, m, n, k, alpha, a, - lda, stride_a, b, ldb, stride_b, beta, c, ldc, stride_c, batch_size, - dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_gemm_strided_batched, queue, transa, transb, m, n, k, alpha, + a, lda, stride_a, b, ldb, stride_b, beta, c, ldc, stride_c, batch_size, + dependencies); } sycl::event gemm_batch(sycl::queue& queue, oneapi::math::transpose transa, @@ -920,8 +920,8 @@ sycl::event omatcopy_batch(sycl::queue& queue, oneapi::math::transpose trans, st std::int64_t n, float alpha, const float* a, std::int64_t lda, std::int64_t stride_a, float* b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_omatcopy_batch, queue, trans, m, n, alpha, a, lda, stride_a, b, - ldb, stride_b, batch_size, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_omatcopy_batch, queue, trans, m, n, alpha, a, lda, stride_a, + b, ldb, stride_b, batch_size, dependencies); } sycl::event omatcopy_batch(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t m, @@ -929,8 +929,8 @@ sycl::event omatcopy_batch(sycl::queue& queue, oneapi::math::transpose trans, st std::int64_t stride_a, double* b, std::int64_t ldb, std::int64_t stride_b, std::int64_t batch_size, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_omatcopy_batch, queue, trans, m, n, alpha, a, lda, stride_a, b, - ldb, stride_b, batch_size, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_omatcopy_batch, queue, trans, m, n, alpha, a, lda, stride_a, + b, ldb, stride_b, batch_size, dependencies); } sycl::event omatcopy_batch(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t m, @@ -984,8 +984,8 @@ sycl::event omatadd_batch(sycl::queue& queue, oneapi::math::transpose transa, float* c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_omatadd_batch, queue, transa, transb, m, n, alpha, a, lda, - stride_a, beta, b, ldb, stride_b, c, ldc, stride_c, batch_size, - dependencies); + stride_a, beta, b, ldb, stride_b, c, ldc, stride_c, batch_size, + dependencies); } sycl::event omatadd_batch(sycl::queue& queue, oneapi::math::transpose transa, @@ -995,8 +995,8 @@ sycl::event omatadd_batch(sycl::queue& queue, oneapi::math::transpose transa, double* c, std::int64_t ldc, std::int64_t stride_c, std::int64_t batch_size, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_omatadd_batch, queue, transa, transb, m, n, alpha, a, lda, - stride_a, beta, b, ldb, stride_b, c, ldc, stride_c, batch_size, - dependencies); + stride_a, beta, b, ldb, stride_b, c, ldc, stride_c, batch_size, + dependencies); } sycl::event omatadd_batch(sycl::queue& queue, oneapi::math::transpose transa, diff --git a/src/blas/backends/generic/generic_common.hpp b/src/blas/backends/generic/generic_common.hpp index e0dc9ddd3..3b9726f58 100644 --- a/src/blas/backends/generic/generic_common.hpp +++ b/src/blas/backends/generic/generic_common.hpp @@ -54,9 +54,9 @@ template struct generic_type; #define DEF_GENERIC_BLAS_TYPE(onemath_t, generic_t) \ - template <> \ - struct generic_type { \ - using type = generic_t; \ + template <> \ + struct generic_type { \ + using type = generic_t; \ }; DEF_GENERIC_BLAS_TYPE(sycl::queue, handle_t) @@ -210,7 +210,7 @@ struct throw_if_unsupported_by_device { throw unimplemented("blas", "onemath_sycl_blas function"); \ } -#define CALL_GENERIC_BLAS_USM_FN(genericFunc, ...) \ +#define CALL_GENERIC_BLAS_USM_FN(genericFunc, ...) \ if constexpr (is_column_major()) { \ detail::throw_if_unsupported_by_device{}( \ " generic BLAS function requiring fp64 support", __VA_ARGS__); \ @@ -218,7 +218,7 @@ struct throw_if_unsupported_by_device { " generic BLAS function requiring fp16 support", __VA_ARGS__); \ auto args = detail::convert_to_generic_type(__VA_ARGS__); \ auto fn = [](auto&&... targs) { \ - return genericFunc(std::forward(targs)...).back(); \ + return genericFunc(std::forward(targs)...).back(); \ }; \ try { \ return std::apply(fn, args); \ diff --git a/src/blas/backends/generic/generic_level1.cxx b/src/blas/backends/generic/generic_level1.cxx index 6e617692b..02815c2a0 100644 --- a/src/blas/backends/generic/generic_level1.cxx +++ b/src/blas/backends/generic/generic_level1.cxx @@ -319,7 +319,8 @@ sycl::event sdsdot(sycl::queue& queue, std::int64_t n, real_t sb, const real_t* [&](sycl::handler& cgh) { cgh.single_task([=]() { result[0] = real_t(0); }); }); std::vector new_dependencies = dependencies; new_dependencies.emplace_back(init_res_val); - CALL_GENERIC_BLAS_USM_FN(::blas::_sdsdot, queue, n, sb, x, incx, y, incy, result, new_dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_sdsdot, queue, n, sb, x, incx, y, incy, result, + new_dependencies); } sycl::event nrm2(sycl::queue& queue, std::int64_t n, const std::complex* x, diff --git a/src/blas/backends/generic/generic_level2.cxx b/src/blas/backends/generic/generic_level2.cxx index 255b3f895..03e805813 100644 --- a/src/blas/backends/generic/generic_level2.cxx +++ b/src/blas/backends/generic/generic_level2.cxx @@ -37,7 +37,7 @@ void gbmv(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t m, std std::int64_t lda, sycl::buffer& x, std::int64_t incx, real_t beta, sycl::buffer& y, std::int64_t incy) { CALL_GENERIC_BLAS_FN(::blas::_gbmv, queue, trans, m, n, kl, ku, alpha, a, lda, x, incx, beta, y, - incy); + incy); } void gbmv(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t m, std::int64_t n, @@ -119,13 +119,14 @@ void sbmv(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_t n, st real_t alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx, real_t beta, sycl::buffer& y, std::int64_t incy) { CALL_GENERIC_BLAS_FN(::blas::_sbmv, queue, upper_lower, n, k, alpha, a, lda, x, incx, beta, y, - incy); + incy); } void symv(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_t n, real_t alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx, real_t beta, sycl::buffer& y, std::int64_t incy) { - CALL_GENERIC_BLAS_FN(::blas::_symv, queue, upper_lower, n, alpha, a, lda, x, incx, beta, y, incy); + CALL_GENERIC_BLAS_FN(::blas::_symv, queue, upper_lower, n, alpha, a, lda, x, incx, beta, y, + incy); } void syr(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_t n, real_t alpha, @@ -160,7 +161,8 @@ void spr2(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_t n, re void tbmv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, oneapi::math::diag unit_diag, std::int64_t n, std::int64_t k, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx) { - CALL_GENERIC_BLAS_FN(::blas::_tbmv, queue, upper_lower, trans, unit_diag, n, k, a, lda, x, incx); + CALL_GENERIC_BLAS_FN(::blas::_tbmv, queue, upper_lower, trans, unit_diag, n, k, a, lda, x, + incx); } void tbmv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, @@ -173,7 +175,8 @@ void tbmv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::tran void tbsv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, oneapi::math::diag unit_diag, std::int64_t n, std::int64_t k, sycl::buffer& a, std::int64_t lda, sycl::buffer& x, std::int64_t incx) { - CALL_GENERIC_BLAS_FN(::blas::_tbsv, queue, upper_lower, trans, unit_diag, n, k, a, lda, x, incx); + CALL_GENERIC_BLAS_FN(::blas::_tbsv, queue, upper_lower, trans, unit_diag, n, k, a, lda, x, + incx); } void tbsv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, @@ -237,8 +240,8 @@ sycl::event gemv(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t real_t alpha, const real_t* a, std::int64_t lda, const real_t* x, std::int64_t incx, real_t beta, real_t* y, std::int64_t incy, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_gemv, queue, trans, m, n, alpha, a, lda, x, incx, beta, y, incy, - dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_gemv, queue, trans, m, n, alpha, a, lda, x, incx, beta, y, + incy, dependencies); } sycl::event gemv(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t m, std::int64_t n, @@ -253,8 +256,8 @@ sycl::event gbmv(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t std::int64_t kl, std::int64_t ku, real_t alpha, const real_t* a, std::int64_t lda, const real_t* x, std::int64_t incx, real_t beta, real_t* y, std::int64_t incy, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_gbmv, queue, trans, m, n, kl, ku, alpha, a, lda, x, incx, beta, y, - incy, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_gbmv, queue, trans, m, n, kl, ku, alpha, a, lda, x, incx, + beta, y, incy, dependencies); } sycl::event gbmv(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t m, std::int64_t n, @@ -268,7 +271,8 @@ sycl::event gbmv(sycl::queue& queue, oneapi::math::transpose trans, std::int64_t sycl::event ger(sycl::queue& queue, std::int64_t m, std::int64_t n, real_t alpha, const real_t* x, std::int64_t incx, const real_t* y, std::int64_t incy, real_t* a, std::int64_t lda, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_ger, queue, m, n, alpha, x, incx, y, incy, a, lda, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_ger, queue, m, n, alpha, x, incx, y, incy, a, lda, + dependencies); } sycl::event gerc(sycl::queue& queue, std::int64_t m, std::int64_t n, std::complex alpha, @@ -339,35 +343,36 @@ sycl::event sbmv(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_ real_t alpha, const real_t* a, std::int64_t lda, const real_t* x, std::int64_t incx, real_t beta, real_t* y, std::int64_t incy, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_sbmv, queue, upper_lower, n, k, alpha, a, lda, x, incx, beta, y, - incy, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_sbmv, queue, upper_lower, n, k, alpha, a, lda, x, incx, beta, + y, incy, dependencies); } sycl::event symv(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_t n, real_t alpha, const real_t* a, std::int64_t lda, const real_t* x, std::int64_t incx, real_t beta, real_t* y, std::int64_t incy, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_symv, queue, upper_lower, n, alpha, a, lda, x, incx, beta, y, - incy, dependencies); + incy, dependencies); } sycl::event syr(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_t n, real_t alpha, const real_t* x, std::int64_t incx, real_t* a, std::int64_t lda, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_syr, queue, upper_lower, n, alpha, x, incx, a, lda, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_syr, queue, upper_lower, n, alpha, x, incx, a, lda, + dependencies); } sycl::event syr2(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_t n, real_t alpha, const real_t* x, std::int64_t incx, const real_t* y, std::int64_t incy, real_t* a, std::int64_t lda, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_syr2, queue, upper_lower, n, alpha, x, incx, y, incy, a, lda, - dependencies); + dependencies); } sycl::event spmv(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_t n, real_t alpha, const real_t* a, const real_t* x, std::int64_t incx, real_t beta, real_t* y, std::int64_t incy, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_spmv, queue, upper_lower, n, alpha, a, x, incx, beta, y, incy, - dependencies); + dependencies); } sycl::event spr(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_t n, real_t alpha, @@ -380,15 +385,15 @@ sycl::event spr2(sycl::queue& queue, oneapi::math::uplo upper_lower, std::int64_ const real_t* x, std::int64_t incx, const real_t* y, std::int64_t incy, real_t* a, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_spr2, queue, upper_lower, n, alpha, x, incx, y, incy, a, - dependencies); + dependencies); } sycl::event tbmv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, oneapi::math::diag unit_diag, std::int64_t n, std::int64_t k, const real_t* a, std::int64_t lda, real_t* x, std::int64_t incx, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_tbmv, queue, upper_lower, trans, unit_diag, n, k, a, lda, x, incx, - dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_tbmv, queue, upper_lower, trans, unit_diag, n, k, a, lda, x, + incx, dependencies); } sycl::event tbmv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, @@ -402,8 +407,8 @@ sycl::event tbsv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::mat oneapi::math::diag unit_diag, std::int64_t n, std::int64_t k, const real_t* a, std::int64_t lda, real_t* x, std::int64_t incx, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_tbsv, queue, upper_lower, trans, unit_diag, n, k, a, lda, x, incx, - dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_tbsv, queue, upper_lower, trans, unit_diag, n, k, a, lda, x, + incx, dependencies); } sycl::event tbsv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, @@ -417,7 +422,7 @@ sycl::event tpmv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::mat oneapi::math::diag unit_diag, std::int64_t n, const real_t* a, real_t* x, std::int64_t incx, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_tpmv, queue, upper_lower, trans, unit_diag, n, a, x, incx, - dependencies); + dependencies); } sycl::event tpmv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, @@ -431,7 +436,7 @@ sycl::event tpsv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::mat oneapi::math::diag unit_diag, std::int64_t n, const real_t* a, real_t* x, std::int64_t incx, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_tpsv, queue, upper_lower, trans, unit_diag, n, a, x, incx, - dependencies); + dependencies); } sycl::event tpsv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, @@ -444,8 +449,8 @@ sycl::event tpsv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::mat sycl::event trmv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, oneapi::math::diag unit_diag, std::int64_t n, const real_t* a, std::int64_t lda, real_t* x, std::int64_t incx, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_trmv, queue, upper_lower, trans, unit_diag, n, a, lda, x, incx, - dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_trmv, queue, upper_lower, trans, unit_diag, n, a, lda, x, + incx, dependencies); } sycl::event trmv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, @@ -458,8 +463,8 @@ sycl::event trmv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::mat sycl::event trsv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, oneapi::math::diag unit_diag, std::int64_t n, const real_t* a, std::int64_t lda, real_t* x, std::int64_t incx, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_trsv, queue, upper_lower, trans, unit_diag, n, a, lda, x, incx, - dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_trsv, queue, upper_lower, trans, unit_diag, n, a, lda, x, + incx, dependencies); } sycl::event trsv(sycl::queue& queue, oneapi::math::uplo upper_lower, oneapi::math::transpose trans, diff --git a/src/blas/backends/generic/generic_level3.cxx b/src/blas/backends/generic/generic_level3.cxx index 39eb9e9b4..254db5507 100644 --- a/src/blas/backends/generic/generic_level3.cxx +++ b/src/blas/backends/generic/generic_level3.cxx @@ -23,8 +23,8 @@ void gemm(sycl::queue& queue, oneapi::math::transpose transa, oneapi::math::tran std::int64_t m, std::int64_t n, std::int64_t k, real_t alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb, real_t beta, sycl::buffer& c, std::int64_t ldc) { - CALL_GENERIC_BLAS_FN(::blas::_gemm, queue, transa, transb, m, n, k, alpha, a, lda, b, ldb, beta, c, - ldc); + CALL_GENERIC_BLAS_FN(::blas::_gemm, queue, transa, transb, m, n, k, alpha, a, lda, b, ldb, beta, + c, ldc); } void gemm(sycl::queue& queue, oneapi::math::transpose transa, oneapi::math::transpose transb, @@ -35,7 +35,8 @@ void gemm(sycl::queue& queue, oneapi::math::transpose transa, oneapi::math::tran using sycl_complex_real_t = sycl::ext::oneapi::experimental::complex; if (transa == oneapi::math::transpose::conjtrans || transb == oneapi::math::transpose::conjtrans) { - throw unimplemented("blas", "gemm", "Conjugate Transpose unsupported yet on onemath_sycl_blas"); + throw unimplemented("blas", "gemm", + "Conjugate Transpose unsupported yet on onemath_sycl_blas"); } // Intermediate buffers for conversion purposes as onemath_sycl_blas expects sycl::complex instead of std::complex sycl::buffer a_pb{ sycl::range<1>(a.size()) }; @@ -55,7 +56,7 @@ void gemm(sycl::queue& queue, oneapi::math::transpose transa, oneapi::math::tran queue.copy(c_acc, c_pb_acc); CALL_GENERIC_BLAS_FN(::blas::_gemm, queue, transa, transb, m, n, k, alpha, a_pb, lda, b_pb, ldb, - beta, c_pb, ldc); + beta, c_pb, ldc); // Copy c_pb back to c sycl::accessor, 1, sycl::access::mode::write> out_acc(c); @@ -68,7 +69,7 @@ void symm(sycl::queue& queue, oneapi::math::side left_right, oneapi::math::uplo std::int64_t lda, sycl::buffer& b, std::int64_t ldb, real_t beta, sycl::buffer& c, std::int64_t ldc) { CALL_GENERIC_BLAS_FN(::blas::_symm, queue, left_right, upper_lower, m, n, alpha, a, lda, b, ldb, - beta, c, ldc); + beta, c, ldc); } void symm(sycl::queue& queue, oneapi::math::side left_right, oneapi::math::uplo upper_lower, @@ -148,8 +149,8 @@ void trsm(sycl::queue& queue, oneapi::math::side left_right, oneapi::math::uplo oneapi::math::transpose trans, oneapi::math::diag unit_diag, std::int64_t m, std::int64_t n, real_t alpha, sycl::buffer& a, std::int64_t lda, sycl::buffer& b, std::int64_t ldb) { - CALL_GENERIC_BLAS_FN(::blas::_trsm, queue, left_right, upper_lower, trans, unit_diag, m, n, alpha, - a, lda, b, ldb); + CALL_GENERIC_BLAS_FN(::blas::_trsm, queue, left_right, upper_lower, trans, unit_diag, m, n, + alpha, a, lda, b, ldb); } void trsm(sycl::queue& queue, oneapi::math::side left_right, oneapi::math::uplo upper_lower, @@ -190,7 +191,7 @@ void omatcopy2(sycl::queue& queue, transpose trans, std::int64_t m, std::int64_t sycl::buffer& a, std::int64_t lda, std::int64_t stridea, sycl::buffer& b, std::int64_t ldb, std::int64_t strideb) { CALL_GENERIC_BLAS_FN(::blas::_omatcopy2, queue, trans, m, n, alpha, a, lda, stridea, b, ldb, - strideb); + strideb); } void omatcopy2(sycl::queue& queue, transpose trans, std::int64_t m, std::int64_t n, @@ -215,8 +216,8 @@ void omatadd(sycl::queue& queue, transpose transa, transpose transb, std::int64_ real_t alpha, sycl::buffer& a, std::int64_t lda, real_t beta, sycl::buffer& b, std::int64_t ldb, sycl::buffer& c, std::int64_t ldc) { - CALL_GENERIC_BLAS_FN(::blas::_omatadd, queue, transa, transb, m, n, alpha, a, lda, beta, b, ldb, c, - ldc); + CALL_GENERIC_BLAS_FN(::blas::_omatadd, queue, transa, transb, m, n, alpha, a, lda, beta, b, ldb, + c, ldc); } void omatadd(sycl::queue& queue, transpose transa, transpose transb, std::int64_t m, std::int64_t n, @@ -232,8 +233,8 @@ sycl::event gemm(sycl::queue& queue, oneapi::math::transpose transa, oneapi::mat std::int64_t m, std::int64_t n, std::int64_t k, real_t alpha, const real_t* a, std::int64_t lda, const real_t* b, std::int64_t ldb, real_t beta, real_t* c, std::int64_t ldc, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_gemm, queue, transa, transb, m, n, k, alpha, a, lda, b, ldb, beta, - c, ldc, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_gemm, queue, transa, transb, m, n, k, alpha, a, lda, b, ldb, + beta, c, ldc, dependencies); } sycl::event gemm(sycl::queue& queue, oneapi::math::transpose transa, oneapi::math::transpose transb, @@ -243,18 +244,19 @@ sycl::event gemm(sycl::queue& queue, oneapi::math::transpose transa, oneapi::mat std::int64_t ldc, const std::vector& dependencies) { if (transa == oneapi::math::transpose::conjtrans || transb == oneapi::math::transpose::conjtrans) { - throw unimplemented("blas", "gemm", "Conjugate Transpose unsupported yet on onemath_sycl_blas"); + throw unimplemented("blas", "gemm", + "Conjugate Transpose unsupported yet on onemath_sycl_blas"); } - CALL_GENERIC_BLAS_USM_FN(::blas::_gemm, queue, transa, transb, m, n, k, alpha, a, lda, b, ldb, beta, - c, ldc, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_gemm, queue, transa, transb, m, n, k, alpha, a, lda, b, ldb, + beta, c, ldc, dependencies); } sycl::event symm(sycl::queue& queue, oneapi::math::side left_right, oneapi::math::uplo upper_lower, std::int64_t m, std::int64_t n, real_t alpha, const real_t* a, std::int64_t lda, const real_t* b, std::int64_t ldb, real_t beta, real_t* c, std::int64_t ldc, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_symm, queue, left_right, upper_lower, m, n, alpha, a, lda, b, ldb, - beta, c, ldc, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_symm, queue, left_right, upper_lower, m, n, alpha, a, lda, b, + ldb, beta, c, ldc, dependencies); } sycl::event symm(sycl::queue& queue, oneapi::math::side left_right, oneapi::math::uplo upper_lower, @@ -338,7 +340,7 @@ sycl::event trsm(sycl::queue& queue, oneapi::math::side left_right, oneapi::math std::int64_t n, real_t alpha, const real_t* a, std::int64_t lda, real_t* b, std::int64_t ldb, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_trsm, queue, left_right, upper_lower, trans, unit_diag, m, n, - alpha, a, lda, b, ldb, dependencies); + alpha, a, lda, b, ldb, dependencies); } sycl::event trsm(sycl::queue& queue, oneapi::math::side left_right, oneapi::math::uplo upper_lower, @@ -370,7 +372,7 @@ sycl::event omatcopy(sycl::queue& queue, transpose trans, std::int64_t m, std::i real_t alpha, const real_t* a, std::int64_t lda, real_t* b, std::int64_t ldb, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_omatcopy, queue, trans, m, n, alpha, a, lda, b, ldb, - dependencies); + dependencies); } sycl::event omatcopy(sycl::queue& queue, transpose trans, std::int64_t m, std::int64_t n, @@ -385,7 +387,7 @@ sycl::event omatcopy2(sycl::queue& queue, transpose trans, std::int64_t m, std:: real_t* b, std::int64_t ldb, std::int64_t strideb, const std::vector& dependencies) { CALL_GENERIC_BLAS_USM_FN(::blas::_omatcopy2, queue, trans, m, n, alpha, a, lda, stridea, b, ldb, - strideb, dependencies); + strideb, dependencies); } sycl::event omatcopy2(sycl::queue& queue, transpose trans, std::int64_t m, std::int64_t n, @@ -411,8 +413,8 @@ sycl::event omatadd(sycl::queue& queue, transpose transa, transpose transb, std: std::int64_t n, real_t alpha, const real_t* a, std::int64_t lda, real_t beta, const real_t* b, std::int64_t ldb, real_t* c, std::int64_t ldc, const std::vector& dependencies) { - CALL_GENERIC_BLAS_USM_FN(::blas::_omatadd, queue, transa, transb, m, n, alpha, a, lda, beta, b, ldb, - c, ldc, dependencies); + CALL_GENERIC_BLAS_USM_FN(::blas::_omatadd, queue, transa, transb, m, n, alpha, a, lda, beta, b, + ldb, c, ldc, dependencies); } sycl::event omatadd(sycl::queue& queue, transpose transa, transpose transb, std::int64_t m, diff --git a/tests/unit_tests/include/test_helper.hpp b/tests/unit_tests/include/test_helper.hpp index f61e3ae0e..d813e7eaa 100644 --- a/tests/unit_tests/include/test_helper.hpp +++ b/tests/unit_tests/include/test_helper.hpp @@ -226,7 +226,7 @@ TEST_RUN_AMDGPU_ROCBLAS_SELECT(q, func, __VA_ARGS__); \ } \ } \ - TEST_RUN_GENERIC_BLAS_SELECT(q, func, __VA_ARGS__); \ + TEST_RUN_GENERIC_BLAS_SELECT(q, func, __VA_ARGS__); \ } while (0); #define TEST_RUN_RNG_CT_SELECT(q, func, ...) \ diff --git a/tests/unit_tests/main_test.cpp b/tests/unit_tests/main_test.cpp index b63e8f9ac..3fc4a490f 100644 --- a/tests/unit_tests/main_test.cpp +++ b/tests/unit_tests/main_test.cpp @@ -112,13 +112,13 @@ int main(int argc, char** argv) { if (unique_devices.find(dev.get_info()) == unique_devices.end()) { unique_devices.insert(dev.get_info()); -#if !defined(ONEMATH_ENABLE_MKLCPU_BACKEND) && \ +#if !defined(ONEMATH_ENABLE_MKLCPU_BACKEND) && \ !defined(ONEMATH_ENABLE_GENERIC_BLAS_BACKEND_INTEL_CPU) && \ !defined(ONEMATH_ENABLE_PORTFFT_BACKEND) && !defined(ONEMATH_ENABLE_NETLIB_BACKEND) if (dev.is_cpu()) continue; #endif -#if !defined(ONEMATH_ENABLE_MKLGPU_BACKEND) && \ +#if !defined(ONEMATH_ENABLE_MKLGPU_BACKEND) && \ !defined(ONEMATH_ENABLE_GENERIC_BLAS_BACKEND_INTEL_GPU) && \ !defined(ONEMATH_ENABLE_PORTFFT_BACKEND) if (dev.is_gpu() && vendor_id == INTEL_ID) @@ -126,7 +126,7 @@ int main(int argc, char** argv) { #endif #if !defined(ONEMATH_ENABLE_CUBLAS_BACKEND) && !defined(ONEMATH_ENABLE_CURAND_BACKEND) && \ !defined(ONEMATH_ENABLE_CUSOLVER_BACKEND) && \ - !defined(ONEMATH_ENABLE_GENERIC_BLAS_BACKEND_NVIDIA_GPU) && \ + !defined(ONEMATH_ENABLE_GENERIC_BLAS_BACKEND_NVIDIA_GPU) && \ !defined(ONEMATH_ENABLE_CUFFT_BACKEND) && !defined(ONEMATH_ENABLE_PORTFFT_BACKEND) && \ !defined(ONEMATH_ENABLE_CUSPARSE_BACKEND) if (dev.is_gpu() && vendor_id == NVIDIA_ID) @@ -134,7 +134,7 @@ int main(int argc, char** argv) { #endif #if !defined(ONEMATH_ENABLE_ROCBLAS_BACKEND) && !defined(ONEMATH_ENABLE_ROCRAND_BACKEND) && \ !defined(ONEMATH_ENABLE_ROCSOLVER_BACKEND) && \ - !defined(ONEMATH_ENABLE_GENERIC_BLAS_BACKEND_AMD_GPU) && \ + !defined(ONEMATH_ENABLE_GENERIC_BLAS_BACKEND_AMD_GPU) && \ !defined(ONEMATH_ENABLE_ROCFFT_BACKEND) && !defined(ONEMATH_ENABLE_PORTFFT_BACKEND) if (dev.is_gpu() && vendor_id == AMD_ID) continue;