fix linalg_solve: add CUDNN_ENFORCE_TENSOR_SIZE_SUPPORTED checks for inputs a and b in MatrixSolveFunctor

fxyfxy777 · fxyfxy777 · commit 4bf1df1ca90c · 2025-07-29T17:22:27.000+08:00
diff --git a/paddle/phi/kernels/funcs/matrix_solve.cu b/paddle/phi/kernels/funcs/matrix_solve.cu
@@ -18,6 +18,7 @@ limitations under the License. */
 #include "paddle/phi/kernels/funcs/blas/blas.h"
 #include "paddle/phi/kernels/funcs/math_function.h"
 #include "paddle/phi/kernels/funcs/scatter.cu.h"
+#include "paddle/phi/backends/gpu/cuda/cudnn_workspace_helper.h"
 
 namespace phi {
 namespace funcs {
@@ -161,11 +162,14 @@ void MatrixSolveFunctor<Context, T>::operator()(const Context& dev_ctx,
   int n = a_dims[a_rank - 1];
   int lda = n;
   int64_t batch_size = a_rank > 2 ? a.numel() / (n * n) : 1;
+  CUDNN_ENFORCE_TENSOR_SIZE_SUPPORTED(a);
+
 
   const auto& b_dims = b.dims();
   const int b_rank = b_dims.size();
   int nrhs = b_dims[b_rank - 1];
   int ldb = n;
+  CUDNN_ENFORCE_TENSOR_SIZE_SUPPORTED(b);
 
   // 1. Copy input A to a temporary tensor tmp_a for LU factorization.
   DenseTensor tmp_a(a.dtype());