Skip to content

Commit

Permalink
fix < 128
Browse files (browse the repository at this point in the history)
Signed-off-by: Lucas Wilkinson <lwilkinson@neuralmagic.com>
  • Loading branch information
LucasWilkinson committed Feb 25, 2025
1 parent b42a7b4 commit 7f541db
Showing 1 changed file with 4 additions and 2 deletions.
Original file line number | Diff line number | Diff line change
Expand Up @@ -457,12 +457,14 @@ struct CollectiveMma<

 #pragma unroll
 for (int i = 0; i < size(tApA_ScaleA); ++i) {
-  tApA_ScaleA(i) = get<0>(tAcA_ScaleA(i)) < scales_m;
+  tApA_ScaleA(i) = get<0>(tAcA_ScaleA(i)) <
+      std::min(scales_m, (m_coord + 1) * ScaleMsPerTile);
 }

 #pragma unroll
 for (int i = 0; i < size(tApA_ScaleA); ++i) {
-  tBpB_ScaleB(i) = get<0>(tBcB_ScaleB(i)) < scales_n;
+  tBpB_ScaleB(i) = get<0>(tBcB_ScaleB(i)) <
+      std::min(scales_n, (n_coord + 1) * ScaleNsPerTile);
 }

// Mainloop
Expand Down

0 comments on commit 7f541db

Please sign in to comment.