@@ -143,26 +143,26 @@ int main(int argc, char* argv[])
143143
144144 if (std::is_same<decltype (layout), ck::tensor_layout::gemm::RowMajor>::value)
145145 {
146- return HostTensorDescriptor ({row, col}, {stride, 1_uz});
146+ return ck:: HostTensorDescriptor ({row, col}, {stride, 1_uz});
147147 }
148148 else
149149 {
150- return HostTensorDescriptor ({row, col}, {1_uz, stride});
150+ return ck:: HostTensorDescriptor ({row, col}, {1_uz, stride});
151151 }
152152 };
153153
154- Tensor<A0DataType> a0_m_k (f_host_tensor_descriptor (M, K, StrideA, A0Layout{}));
155- Tensor<A1DataType> a1_m_k (f_host_tensor_descriptor ((M + Scale_Block_M - 1 ) / Scale_Block_M,
156- (K + Scale_Block_K - 1 ) / Scale_Block_K,
157- Scale_Stride_AM,
158- A0Layout{}));
159- Tensor<B0DataType> b0_k_n (f_host_tensor_descriptor (K, N, StrideB, B0Layout{}));
160- Tensor<B1DataType> b1_k_n (f_host_tensor_descriptor ((K + Scale_Block_K - 1 ) / Scale_Block_K,
161- (N + Scale_Block_N - 1 ) / Scale_Block_N,
162- Scale_Stride_BN,
163- B0Layout{}));
164- Tensor<EDataType> e_m_n_host_result (f_host_tensor_descriptor (M, N, StrideE, ELayout{}));
165- Tensor<EDataType> e_m_n_device_result (f_host_tensor_descriptor (M, N, StrideE, ELayout{}));
154+ ck:: Tensor<A0DataType> a0_m_k (f_host_tensor_descriptor (M, K, StrideA, A0Layout{}));
155+ ck:: Tensor<A1DataType> a1_m_k (f_host_tensor_descriptor ((M + Scale_Block_M - 1 ) / Scale_Block_M,
156+ (K + Scale_Block_K - 1 ) / Scale_Block_K,
157+ Scale_Stride_AM,
158+ A0Layout{}));
159+ ck:: Tensor<B0DataType> b0_k_n (f_host_tensor_descriptor (K, N, StrideB, B0Layout{}));
160+ ck:: Tensor<B1DataType> b1_k_n (f_host_tensor_descriptor ((K + Scale_Block_K - 1 ) / Scale_Block_K,
161+ (N + Scale_Block_N - 1 ) / Scale_Block_N,
162+ Scale_Stride_BN,
163+ B0Layout{}));
164+ ck:: Tensor<EDataType> e_m_n_host_result (f_host_tensor_descriptor (M, N, StrideE, ELayout{}));
165+ ck:: Tensor<EDataType> e_m_n_device_result (f_host_tensor_descriptor (M, N, StrideE, ELayout{}));
166166
167167 std::cout << " a0_m_k: " << a0_m_k.mDesc << std::endl;
168168 std::cout << " a1_m_k: " << a1_m_k.mDesc << std::endl;
@@ -210,11 +210,11 @@ int main(int argc, char* argv[])
210210 b1_k_n.GenerateTensorValue (GeneratorTensor_3<B1DataType>{0 , 1.0 });
211211 }
212212
213- DeviceMem a0_device_buf (sizeof (A0DataType) * a0_m_k.mDesc .GetElementSpaceSize ());
214- DeviceMem a1_device_buf (sizeof (A1DataType) * a1_m_k.mDesc .GetElementSpaceSize ());
215- DeviceMem b0_device_buf (sizeof (B0DataType) * b0_k_n.mDesc .GetElementSpaceSize ());
216- DeviceMem b1_device_buf (sizeof (B1DataType) * b1_k_n.mDesc .GetElementSpaceSize ());
217- DeviceMem e_device_buf (sizeof (EDataType) * e_m_n_device_result.mDesc .GetElementSpaceSize ());
213+ ck:: DeviceMem a0_device_buf (sizeof (A0DataType) * a0_m_k.mDesc .GetElementSpaceSize ());
214+ ck:: DeviceMem a1_device_buf (sizeof (A1DataType) * a1_m_k.mDesc .GetElementSpaceSize ());
215+ ck:: DeviceMem b0_device_buf (sizeof (B0DataType) * b0_k_n.mDesc .GetElementSpaceSize ());
216+ ck:: DeviceMem b1_device_buf (sizeof (B1DataType) * b1_k_n.mDesc .GetElementSpaceSize ());
217+ ck:: DeviceMem e_device_buf (sizeof (EDataType) * e_m_n_device_result.mDesc .GetElementSpaceSize ());
218218
219219 a0_device_buf.ToDevice (a0_m_k.mData .data ());
220220 a1_device_buf.ToDevice (a1_m_k.mData .data ());
@@ -269,9 +269,9 @@ int main(int argc, char* argv[])
269269
270270 if (do_verification)
271271 {
272- Tensor<AccDataType> c_m_n ({M, N});
273- Tensor<float > a_m_k ({M, K});
274- Tensor<float > b_k_n ({K, N});
272+ ck:: Tensor<AccDataType> c_m_n ({M, N});
273+ ck:: Tensor<float > a_m_k ({M, K});
274+ ck:: Tensor<float > b_k_n ({K, N});
275275
276276 for (int m = 0 ; m < M; m++)
277277 {
0 commit comments