From bb43d5e1e4c96aba47507cfa3bd91b78ed355ba1 Mon Sep 17 00:00:00 2001 From: MaxAkaAltmer Date: Sun, 1 Sep 2024 17:47:09 +0300 Subject: [PATCH 1/2] Include of regular_tile_iterator.h fixed for NVRTC --- .../transform/threadblock/regular_tile_iterator_pitch_linear.h | 2 +- .../regular_tile_iterator_pitch_linear_2dthreadtile.h | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/include/cutlass/transform/threadblock/regular_tile_iterator_pitch_linear.h b/include/cutlass/transform/threadblock/regular_tile_iterator_pitch_linear.h index 1dfde983e9..1e04c4262d 100644 --- a/include/cutlass/transform/threadblock/regular_tile_iterator_pitch_linear.h +++ b/include/cutlass/transform/threadblock/regular_tile_iterator_pitch_linear.h @@ -45,7 +45,7 @@ #include "cutlass/layout/matrix.h" #include "cutlass/layout/pitch_linear.h" -#include "regular_tile_iterator.h" +#include "cutlass/transform/threadblock/regular_tile_iterator.h" ///////////////////////////////////////////////////////////////////////////////////////////////// diff --git a/include/cutlass/transform/threadblock/regular_tile_iterator_pitch_linear_2dthreadtile.h b/include/cutlass/transform/threadblock/regular_tile_iterator_pitch_linear_2dthreadtile.h index a62ff8dd6b..7fd4959845 100644 --- a/include/cutlass/transform/threadblock/regular_tile_iterator_pitch_linear_2dthreadtile.h +++ b/include/cutlass/transform/threadblock/regular_tile_iterator_pitch_linear_2dthreadtile.h @@ -45,7 +45,7 @@ #include "cutlass/layout/matrix.h" #include "cutlass/layout/pitch_linear.h" -#include "regular_tile_iterator.h" +#include "cutlass/transform/threadblock/regular_tile_iterator.h" ///////////////////////////////////////////////////////////////////////////////////////////////// From c9da4788e75a2702a74ac8ef99ecc29b62adc00b Mon Sep 17 00:00:00 2001 From: MaxAkaAltmer Date: Sun, 1 Sep 2024 23:19:01 +0300 Subject: [PATCH 2/2] More include fixed for NVRTC --- include/cutlass/epilogue/threadblock/default_thread_map_simt.h | 2 +- .../cutlass/epilogue/threadblock/default_thread_map_tensor_op.h | 2 +- .../epilogue/threadblock/default_thread_map_volta_tensor_op.h | 2 +- .../epilogue/threadblock/default_thread_map_wmma_tensor_op.h | 2 +- 4 files changed, 4 insertions(+), 4 deletions(-) diff --git a/include/cutlass/epilogue/threadblock/default_thread_map_simt.h b/include/cutlass/epilogue/threadblock/default_thread_map_simt.h index a5559f67a4..2092caf4d7 100644 --- a/include/cutlass/epilogue/threadblock/default_thread_map_simt.h +++ b/include/cutlass/epilogue/threadblock/default_thread_map_simt.h @@ -35,7 +35,7 @@ #pragma once -#include "predicated_tile_iterator.h" +#include "cutlass/epilogue/threadblock/predicated_tile_iterator.h" #include "cutlass/gemm/gemm.h" ///////////////////////////////////////////////////////////////////////////////////////////////// diff --git a/include/cutlass/epilogue/threadblock/default_thread_map_tensor_op.h b/include/cutlass/epilogue/threadblock/default_thread_map_tensor_op.h index e4198dc42d..e39ca9d539 100644 --- a/include/cutlass/epilogue/threadblock/default_thread_map_tensor_op.h +++ b/include/cutlass/epilogue/threadblock/default_thread_map_tensor_op.h @@ -35,7 +35,7 @@ #pragma once -#include "predicated_tile_iterator.h" +#include "cutlass/epilogue/threadblock/predicated_tile_iterator.h" #include "cutlass/gemm/gemm.h" #include "cutlass/layout/pitch_linear.h" diff --git a/include/cutlass/epilogue/threadblock/default_thread_map_volta_tensor_op.h b/include/cutlass/epilogue/threadblock/default_thread_map_volta_tensor_op.h index f0ccd74e65..1eac4a1834 100644 --- a/include/cutlass/epilogue/threadblock/default_thread_map_volta_tensor_op.h +++ b/include/cutlass/epilogue/threadblock/default_thread_map_volta_tensor_op.h @@ -35,7 +35,7 @@ #pragma once -#include "predicated_tile_iterator.h" +#include "cutlass/epilogue/threadblock/predicated_tile_iterator.h" #include "cutlass/gemm/gemm.h" ///////////////////////////////////////////////////////////////////////////////////////////////// diff --git a/include/cutlass/epilogue/threadblock/default_thread_map_wmma_tensor_op.h b/include/cutlass/epilogue/threadblock/default_thread_map_wmma_tensor_op.h index 9f01d1fffc..0dccf6525a 100644 --- a/include/cutlass/epilogue/threadblock/default_thread_map_wmma_tensor_op.h +++ b/include/cutlass/epilogue/threadblock/default_thread_map_wmma_tensor_op.h @@ -35,7 +35,7 @@ #pragma once -#include "predicated_tile_iterator.h" +#include "cutlass/epilogue/threadblock/predicated_tile_iterator.h" #include "cutlass/gemm/gemm.h" #include "cutlass/layout/pitch_linear.h"