From 262cf77ff544df5527139f2100e1f6a2807b1d22 Mon Sep 17 00:00:00 2001 From: anton aksenov Date: Tue, 14 Jan 2025 09:46:03 +0300 Subject: [PATCH] 4.2.2 task done --- src/cl/matrix_multiplication.cl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/cl/matrix_multiplication.cl b/src/cl/matrix_multiplication.cl index da9154c..8f9d386 100644 --- a/src/cl/matrix_multiplication.cl +++ b/src/cl/matrix_multiplication.cl @@ -94,7 +94,7 @@ __kernel void matrix_multiplication_local_wpt( for (int tile_start = 0; tile_start < (K + TILE_SIZE - 1) / TILE_SIZE; tile_start++) { for (int w = 0; w < WORK_PER_THREAD; w++) { tile_a[local_j * WORK_PER_THREAD + w][local_i] = as[(tile_start * TILE_SIZE + local_i) + (j * WORK_PER_THREAD + w) * K]; - tile_b[local_j * WORK_PER_THREAD + w][local_i] = bs[(local_i) + (tile_start * TILE_SIZE + local_j * WORK_PER_THREAD + w) * N]; + tile_b[local_j * WORK_PER_THREAD + w][local_i] = bs[(i) + (tile_start * TILE_SIZE + local_j * WORK_PER_THREAD + w) * N]; } barrier(CLK_LOCAL_MEM_FENCE);