Skip to content

Commit

Permalink
General Formatting
Browse files Browse the repository at this point in the history
  • Loading branch information
OuadiElfarouki committed Jul 28, 2023
1 parent 5821b1a commit cf2f38c
Show file tree
Hide file tree
Showing 5 changed files with 15 additions and 17 deletions.
8 changes: 4 additions & 4 deletions benchmark/syclblas/extension/omatcopy.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -77,8 +77,8 @@ void run(benchmark::State& state, blas::SB_Handle* sb_handle_ptr, int ti,
auto m_b_temp_gpu =
blas::make_sycl_iterator_buffer<scalar_t>(m_b_temp, size_b);

auto event = blas::_omatcopy(sb_handle, *t_str, m, n, alpha,
m_a_gpu, lda, m_b_temp_gpu, ldb);
auto event = blas::_omatcopy(sb_handle, *t_str, m, n, alpha, m_a_gpu, lda,
m_b_temp_gpu, ldb);

sb_handle.wait();
}
Expand All @@ -92,8 +92,8 @@ void run(benchmark::State& state, blas::SB_Handle* sb_handle_ptr, int ti,
#endif

auto blas_method_def = [&]() -> std::vector<cl::sycl::event> {
auto event = blas::_omatcopy(sb_handle, *t_str, m, n, alpha,
m_a_gpu, lda, m_b_gpu, ldb);
auto event = blas::_omatcopy(sb_handle, *t_str, m, n, alpha, m_a_gpu, lda,
m_b_gpu, ldb);
sb_handle.wait(event);
return event;
};
Expand Down
10 changes: 5 additions & 5 deletions include/interface/extension_interface.h
Original file line number Diff line number Diff line change
Expand Up @@ -179,8 +179,8 @@ template <typename element_t, typename sb_handle_t, typename index_t,
typename sb_handle_t::event_t _transpose(sb_handle_t& sb_handle, index_t m,
index_t n, in_t A, index_t ld_in,
index_t ld_out) {
return blas::internal::_transpose<true, element_t>(sb_handle, m, n, A, ld_in, A,
ld_out);
return blas::internal::_transpose<true, element_t>(sb_handle, m, n, A, ld_in,
A, ld_out);
}

/**
Expand All @@ -207,8 +207,8 @@ template <typename element_t, typename sb_handle_t, typename index_t,
typename sb_handle_t::event_t _transpose(sb_handle_t& sb_handle, index_t m,
index_t n, in_t A, index_t ld_a,
out_t B, index_t ld_b) {
return blas::internal::_transpose<false, element_t>(sb_handle, m, n, A, ld_a, B,
ld_b);
return blas::internal::_transpose<false, element_t>(sb_handle, m, n, A, ld_a,
B, ld_b);
}

template <typename operator_t, typename element_t, typename sb_handle_t,
Expand All @@ -222,7 +222,7 @@ typename sb_handle_t::event_t _reduction(sb_handle_t& sb_handle,
sb_handle, buffer_in, ld, buffer_out, rows, cols, reduction_dim);
}

} // namespace extension
} // namespace extension

} // namespace blas

Expand Down
6 changes: 2 additions & 4 deletions src/interface/extension/backend/nvidia_gpu.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -37,14 +37,12 @@ typename sb_handle_t::event_t _transpose_outplace(
container_0_t in_, index_t _ld_in, index_t _inc_in, container_1_t out_,
index_t _ld_out, index_t _inc_out) {
if (_M * _N > (1 << 18)) {
return blas::internal::_transpose_outplace_impl<32, 512, 128,
true>(
return blas::internal::_transpose_outplace_impl<32, 512, 128, true>(
sb_handle, _M, _N, _alpha, in_, _ld_in, _inc_in, out_, _ld_out,
_inc_out);

} else {
return blas::internal::_transpose_outplace_impl<32, 128, 128,
true>(
return blas::internal::_transpose_outplace_impl<32, 128, 128, true>(
sb_handle, _M, _N, _alpha, in_, _ld_in, _inc_in, out_, _ld_out,
_inc_out);
}
Expand Down
4 changes: 2 additions & 2 deletions test/unittest/extension/omatcopy2_test.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -71,8 +71,8 @@ void run_test(const combination_t<scalar_t> combi) {
auto matrix_in = blas::make_sycl_iterator_buffer<scalar_t>(A, m_a_size);
auto matrix_out = blas::make_sycl_iterator_buffer<scalar_t>(B, m_b_size);

blas::_omatcopy2(sb_handle, trans, m, n, alpha, matrix_in, ld_in,
inc_in, matrix_out, ld_out, inc_out);
blas::_omatcopy2(sb_handle, trans, m, n, alpha, matrix_in, ld_in, inc_in,
matrix_out, ld_out, inc_out);

auto event = blas::helper::copy_to_host<scalar_t>(
sb_handle.get_queue(), matrix_out, B.data(), m_b_size);
Expand Down
4 changes: 2 additions & 2 deletions test/unittest/extension/omatcopy_test.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -62,8 +62,8 @@ void run_test(const combination_t<scalar_t> combi) {
auto matrix_in = blas::make_sycl_iterator_buffer<scalar_t>(A, size_a);
auto matrix_out = blas::make_sycl_iterator_buffer<scalar_t>(B, size_b);

blas::_omatcopy(sb_handle, trans, m, n, alpha, matrix_in, ld_in,
matrix_out, ld_out);
blas::_omatcopy(sb_handle, trans, m, n, alpha, matrix_in, ld_in, matrix_out,
ld_out);

auto event = blas::helper::copy_to_host<scalar_t>(
sb_handle.get_queue(), matrix_out, B.data(), size_b);
Expand Down

0 comments on commit cf2f38c

Please sign in to comment.