Skip to content

Commit 596155e

Browse files
committed
Fix error in SYCL's basic data parallel kernel (only manifested in multi-GPU setups): grid_x_offset and grid_y_offset were swapped.
1 parent 6ec59bb commit 596155e

File tree

1 file changed

+2
-2
lines changed
  • include/plssvm/backends/SYCL/kernel/cg_explicit/basic

1 file changed

+2
-2
lines changed

include/plssvm/backends/SYCL/kernel/cg_explicit/basic/blas.hpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -380,8 +380,8 @@ class device_kernel_inplace_matrix_scale {
380380
constexpr auto PADDING_SIZE_uz = static_cast<std::size_t>(PADDING_SIZE);
381381

382382
// calculate the indices used in the current work-item
383-
const auto i_idx = (idx.get_id(1) + grid_x_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_rows
384-
const auto j_idx = (idx.get_id(0) + grid_y_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_rhs
383+
const auto i_idx = (idx.get_id(1) + grid_y_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_rows
384+
const auto j_idx = (idx.get_id(0) + grid_x_offset_ * THREAD_BLOCK_SIZE_uz) * INTERNAL_BLOCK_SIZE_uz; // num_rhs
385385

386386
for (unsigned internal_i = 0; internal_i < INTERNAL_BLOCK_SIZE; ++internal_i) {
387387
for (unsigned internal_j = 0; internal_j < INTERNAL_BLOCK_SIZE; ++internal_j) {

0 commit comments

Comments
 (0)