Added cudaWarnIfError/OPM_CUDA_WARN_IF_ERROR

2025-02-25 18:55:30 -06:00 · 2023-05-09 14:13:32 +02:00
parent cab0efeec5
commit 863647f592
1 changed files with 98 additions and 10 deletions
--- a/opm/simulators/linalg/cuistl/detail/cuda_safe_call.hpp
+++ b/opm/simulators/linalg/cuistl/detail/cuda_safe_call.hpp
@@ -21,10 +21,43 @@
 #include <cuda_runtime.h>
 #include <fmt/core.h>
 #include <opm/common/ErrorMacros.hpp>
+#include <opm/common/OpmLog/OpmLog.hpp>
 #include <string_view>

 namespace Opm::cuistl::detail
 {
+/**
+ * @brief getCudaErrorMessage generates the error message to display for a given error.
+ *
+ * @param error the CUDA error code (a cudaError_t) to describe
+ * @param expression the expression (say "cudaMalloc(&pointer, 1)")
+ * @param filename the code file the error occurred in (typically __FILE__)
+ * @param functionName name of the function the error occurred in (typically __func__)
+ * @param lineNumber the line number the error occurred in (typically __LINE__)
+ *
+ * @todo Refactor to use std::source_location once we shift to C++20
+ *
+ * @return An error message to be displayed.
+ *
+ * @note This function is mostly for internal use.
+ */
+inline std::string
+getCudaErrorMessage(cudaError_t error,
+                    const std::string_view& expression,
+                    const std::string_view& filename,
+                    const std::string_view& functionName,
+                    size_t lineNumber)
+{
+    return fmt::format("CUDA expression did not execute correctly. Expression was: \n"
+                       "    {}\n"
+                       "CUDA error was {}\n"
+                       "in function {}, in {}, at line {}\n",
+                       expression,
+                       cudaGetErrorString(error),
+                       functionName,
+                       filename,
+                       lineNumber);
+}

 /**
 * @brief cudaSafeCall checks the return type of the CUDA expression (function call) and throws an exception if it
@@ -53,18 +86,52 @@ cudaSafeCall(cudaError_t error,
             size_t lineNumber)
 {
    if (error != cudaSuccess) {
-        OPM_THROW(std::runtime_error,
-                  fmt::format("CUDA expression did not execute correctly. Expression was: \n"
-                              "    {}\n"
-                              "CUDA error was {}\n"
-                              "in function {}, in {}, at line {}\n",
-                              expression,
-                              cudaGetErrorString(error),
-                              functionName,
-                              filename,
-                              lineNumber));
+        OPM_THROW(std::runtime_error, getCudaErrorMessage(error, expression, filename, functionName, lineNumber));
    }
 }
+
+/**
+ * @brief cudaWarnIfError checks the return type of the CUDA expression (function call) and issues a warning if it
+ * does not equal cudaSuccess.
+ *
+ * @param error the CUDA error code (a cudaError_t) to check
+ * @param expression the expression (say "cudaMalloc(&pointer, 1)")
+ * @param filename the code file the error occurred in (typically __FILE__)
+ * @param functionName name of the function the error occurred in (typically __func__)
+ * @param lineNumber the line number the error occurred in (typically __LINE__)
+ *
+ * @return the error sent in (for convenience).
+ *
+ * Example usage:
+ * @code{.cpp}
+ * #include <opm/simulators/linalg/cuistl/detail/cuda_safe_call.hpp>
+ * #include <cuda_runtime.h>
+ *
+ * void some_function() {
+ *     void* somePointer;
+ *     cudaWarnIfError(cudaMalloc(&somePointer, 1), "cudaMalloc(&somePointer, 1)", __FILE__, __func__, __LINE__);
+ * }
+ * @endcode
+ *
+ * @note It is probably easier to use the macro OPM_CUDA_WARN_IF_ERROR
+ *
+ * @note Prefer the cudaSafeCall/OPM_CUDA_SAFE_CALL counterpart unless you really don't want to throw an exception.
+ *
+ * @todo Refactor to use std::source_location once we shift to C++20
+ */
+inline cudaError_t
+cudaWarnIfError(cudaError_t error,
+                const std::string_view& expression,
+                const std::string_view& filename,
+                const std::string_view& functionName,
+                size_t lineNumber)
+{
+    if (error != cudaSuccess) {
+        OpmLog::warning(getCudaErrorMessage(error, expression, filename, functionName, lineNumber));
+    }
+
+    return error;
+}
 } // namespace Opm::cuistl::detail

 /**
@@ -87,4 +154,25 @@ cudaSafeCall(cudaError_t error,
 #define OPM_CUDA_SAFE_CALL(expression)                                                                                 \
    ::Opm::cuistl::detail::cudaSafeCall(expression, #expression, __FILE__, __func__, __LINE__)

+
+/**
+ * @brief OPM_CUDA_WARN_IF_ERROR checks the return type of the CUDA expression (function call) and issues a warning if
+ * it does not equal cudaSuccess. The macro evaluates to the cudaError_t produced by the expression.
+ *
+ * Example usage:
+ * @code{.cpp}
+ * #include <opm/simulators/linalg/cuistl/detail/cuda_safe_call.hpp>
+ * #include <cuda_runtime.h>
+ *
+ * void some_function() {
+ *     void* somePointer;
+ *     OPM_CUDA_WARN_IF_ERROR(cudaMalloc(&somePointer, 1));
+ * }
+ * @endcode
+ *
+ * @note Prefer the cudaSafeCall/OPM_CUDA_SAFE_CALL counterpart unless you really don't want to throw an exception.
+ */
+#define OPM_CUDA_WARN_IF_ERROR(expression)                                                                             \
+    ::Opm::cuistl::detail::cudaWarnIfError(expression, #expression, __FILE__, __func__, __LINE__)
+
 #endif