diff --git a/include/micm/cuda/util/cuda_dense_matrix.hpp b/include/micm/cuda/util/cuda_dense_matrix.hpp index 37a7943c..ba2b6ad9 100644 --- a/include/micm/cuda/util/cuda_dense_matrix.hpp +++ b/include/micm/cuda/util/cuda_dense_matrix.hpp @@ -231,8 +231,10 @@ namespace micm { if constexpr (std::is_same_v) { - // the cudaMemset function only works for integer types and is an asynchronous function: https://docs.nvidia.com/cuda/cuda-runtime-api/group__CUDART__MEMORY.html#group__CUDART__MEMORY_1gf7338650f7683c51ee26aadc6973c63a - CHECK_CUDA_ERROR(cudaMemset(this->param_.d_data_, val, sizeof(double) * this->param_.number_of_elements_), "cudaMemset"); + // the cudaMemset function only works for integer types and is an asynchronous function: + // https://docs.nvidia.com/cuda/cuda-runtime-api/group__CUDART__MEMORY.html#group__CUDART__MEMORY_1gf7338650f7683c51ee26aadc6973c63a + CHECK_CUDA_ERROR( + cudaMemset(this->param_.d_data_, val, sizeof(double) * this->param_.number_of_elements_), "cudaMemset"); } else { diff --git a/include/micm/cuda/util/cuda_matrix.cuh b/include/micm/cuda/util/cuda_matrix.cuh index bd654dac..f68efef6 100644 --- a/include/micm/cuda/util/cuda_matrix.cuh +++ b/include/micm/cuda/util/cuda_matrix.cuh @@ -41,7 +41,6 @@ namespace micm /// @returns Error code from copying to destination device memory from source device memory, if any cudaError_t CopyToDeviceFromDevice(CudaMatrixParam& vectorMatrixDest, const CudaMatrixParam& vectorMatrixSrc); - /// @brief Fills a CUDA matrix with a specified value /// @param param Struct containing allocated device memory /// @param val Value to fill the matrix with diff --git a/include/micm/cuda/util/cuda_sparse_matrix.hpp b/include/micm/cuda/util/cuda_sparse_matrix.hpp index a40fc81a..25a92d4b 100644 --- a/include/micm/cuda/util/cuda_sparse_matrix.hpp +++ b/include/micm/cuda/util/cuda_sparse_matrix.hpp @@ -131,8 +131,10 @@ namespace micm { if constexpr (std::is_same_v) { - // the cudaMemset function only works for integer types and is an asynchronous function: https://docs.nvidia.com/cuda/cuda-runtime-api/group__CUDART__MEMORY.html#group__CUDART__MEMORY_1gf7338650f7683c51ee26aadc6973c63a - CHECK_CUDA_ERROR(cudaMemset(this->param_.d_data_, val, sizeof(double) * this->param_.number_of_elements_), "cudaMemset"); + // the cudaMemset function only works for integer types and is an asynchronous function: + // https://docs.nvidia.com/cuda/cuda-runtime-api/group__CUDART__MEMORY.html#group__CUDART__MEMORY_1gf7338650f7683c51ee26aadc6973c63a + CHECK_CUDA_ERROR( + cudaMemset(this->param_.d_data_, val, sizeof(double) * this->param_.number_of_elements_), "cudaMemset"); } else { diff --git a/src/util/cuda_matrix.cu b/src/util/cuda_matrix.cu index 1f4b9736..cc0e373a 100644 --- a/src/util/cuda_matrix.cu +++ b/src/util/cuda_matrix.cu @@ -1,8 +1,9 @@ // Copyright (C) 2023-2024 National Center for Atmospheric Research // SPDX-License-Identifier: Apache-2.0 #include -#include #include +#include + #include #include