add eager and static backend to wrap lower level api
cxxly committed Jul 28, 2023
1 parent 690a0b9 commit 4ee2d44
Showing 6 changed files with 173 additions and 132 deletions.
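
In outline, the commit moves the shared primitive helpers behind a backend layer: paddle/primitive/primitive/primitive.h becomes a thin templated front end that forwards to per-backend specializations under paddle/primitive/backend/. A minimal sketch of the dispatch pattern, condensed from the diffs below:

    // primitive.h: one templated entry point per op
    template <typename T>
    Tensor tanh(const Tensor& x) {
      return backend::experimental::tanh<T>(x);
    }

    // eager_backend.cc specializes tanh<Tensor> (dygraph, calls ::tanh_ad_func);
    // static_backend.cc specializes tanh<DescTensor> (builds program-desc ops).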
2 changes: 1 addition & 1 deletion paddle/primitive/CMakeLists.txt
@@ -1,3 +1,3 @@
add_subdirectory(primitive)
add_subdirectory(backend)
add_subdirectory(rule)
add_subdirectory(type)
8 changes: 4 additions & 4 deletions paddle/primitive/backend/CMakeLists.txt
@@ -1,10 +1,10 @@
if(NOT (NOT WITH_PYTHON AND ON_INFER))
  cc_library(
    experimental_eager_primitive
    SRCS eager_primitive.cc
    experimental_eager_primitive_backend
    SRCS eager_backend.cc
    DEPS final_dygraph_function eager_utils)
endif()
cc_library(
  experimental_static_primitive
  SRCS static_primitive.cc
  experimental_static_primitive_backend
  SRCS static_backend.cc
  DEPS proto_desc static_utils)
157 changes: 157 additions & 0 deletions paddle/primitive/backend/backend.h
@@ -0,0 +1,157 @@
// Copyright (c) 2023 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <string>
#include <vector>

#include "paddle/fluid/framework/op_proto_maker.h"
#include "paddle/fluid/operators/common_infer_shape_functions.h"
#include "paddle/fluid/prim/api/generated_prim/prim_generated_api.h"
#include "paddle/phi/common/data_type.h"
#include "paddle/phi/common/int_array.h"
#include "paddle/phi/common/place.h"
#include "paddle/phi/common/scalar.h"
#include "paddle/phi/core/ddim.h"
#include "paddle/phi/kernels/funcs/blas/blas.h"
#include "paddle/utils/optional.h"

namespace paddle {
namespace primitive {
namespace backend {
namespace experimental {

using Tensor = paddle::Tensor;

template <typename T>
Tensor tanh(const Tensor& x);

template <typename T>
Tensor empty(const paddle::experimental::IntArray& shape,
             phi::DataType dtype,
             const paddle::Place& place);

template <typename T>
Tensor empty_like(const Tensor& x,
                  phi::DataType dtype,
                  const paddle::Place& place);

// Copy a tensor to the output pointer; in static mode this requires an assign op.
template <typename T>
void by_pass(const Tensor& x, Tensor* out);

// Set the output pointer's impl from the temporary's impl; in dygraph mode, OutGradMeta should also be set.
template <typename T>
void set_output(const Tensor& x_tmp, Tensor* x);
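
// Editor's note (illustration, not part of this commit): a hypothetical
// gradient rule showing the intended call pattern; `tanh_grad`, `out`,
// `grad_out`, and `dx` are made-up names for this sketch.
//
//   template <typename T>
//   void tanh_grad(const Tensor& out, const Tensor& grad_out, Tensor* dx) {
//     Tensor tmp = ...;        // e.g. grad_out * (1 - out * out)
//     set_output<T>(tmp, dx);  // bind the temporary's impl to the output
//   }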

// These helpers are shared by both backends and don't need to be specialized.
static phi::DDim get_reduce_dims_from_out(const phi::DDim& dout_dims,
                                          const phi::DDim& in_dims) {
  std::vector<int64_t> result;
  int bat = dout_dims.size() - in_dims.size();
  for (int i = 0; i < bat; ++i) {
    result.push_back(i);
  }
  for (int i = 0; i < in_dims.size(); ++i) {
    if (in_dims[i] == 1) {
      result.push_back(i + bat);
    } else {
      PADDLE_ENFORCE_EQ(
          in_dims[i],
          dout_dims[i + bat],
          platform::errors::InvalidArgument(
              "ReduceDims dimension mismatch. Operands could "
              "not be broadcast together with the shape of dout = [%s] and "
              "the shape of in_dims = [%s]. Received [%d] in X is not equal to "
              "[%d] in Y at i:%d.",
              dout_dims,
              in_dims,
              dout_dims[i + bat],
              in_dims[i],
              i));
    }
  }
  return phi::make_ddim(result);
}
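
// Editor's note (illustration, not part of this commit): with
// dout_dims = [4, 3, 5] and in_dims = [3, 1], bat = 1, so the leading
// broadcast axis 0 and the size-1 input axis (axis 2 of dout) are reduced:
//
//   auto rd = get_reduce_dims_from_out(phi::make_ddim({4, 3, 5}),
//                                      phi::make_ddim({3, 1}));
//   // rd == [0, 2]; reducing dout over these axes (keeping dims)
//   // recovers the input shape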

static phi::DDim get_reduce_dims(const phi::DDim& x_dims,
                                 const phi::DDim& y_dims) {
  auto out_dims = paddle::operators::details::BroadcastTwoDims(x_dims, y_dims);
  return get_reduce_dims_from_out(out_dims, x_dims);
}
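
// Editor's note (illustration): this overload first broadcasts the two
// shapes, then reuses the helper above; e.g. x_dims = [3, 1] and
// y_dims = [4, 3, 5] broadcast to [4, 3, 5]:
//
//   auto rd = get_reduce_dims(phi::make_ddim({3, 1}),
//                             phi::make_ddim({4, 3, 5}));  // rd == [0, 2]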

static std::vector<int> get_reduce_dims(const Tensor& dx,
                                        const int& dout_ndim,
                                        const int& x_ndim,
                                        std::vector<int64_t>* x_dims) {
  // This branch handles broadcasting with a 1-D operand: the 1-D tensor is
  // promoted to 2-D, which makes ddout_ndim > dout_ndim, but ddout_ndim is
  // only used when grad_out_grad != nullptr.
  if (dout_ndim < x_ndim) {
    return std::vector<int>({});
  }
  const std::vector<std::int64_t> dx_dims = phi::vectorize(dx.dims());
  std::vector<std::int64_t> broadcast_dims(dout_ndim);
  std::fill(
      broadcast_dims.data(), broadcast_dims.data() + dout_ndim - x_ndim, 1);
  std::copy(x_dims->data(),
            x_dims->data() + x_ndim,
            broadcast_dims.data() + dout_ndim - x_ndim);
  std::vector<int> reduce_dims;
  for (int i = 0; i <= dout_ndim - 3; i++) {
    if (dx_dims[i] != 1 && broadcast_dims[i] == 1) {
      reduce_dims.push_back(i);
    }
  }
  return reduce_dims;
}
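
// Editor's note (illustration, assuming a Tensor `dx` of shape
// [5, 2, 3, 4]): with dout_ndim = 4 and x_ndim = 2, x's dims are
// right-aligned into broadcast_dims = [1, 1, 3, 4]; the loop scans only
// the batch axes (it stops before the last two matmul axes) and keeps
// those where x was broadcast (extent 1) while dx has extent > 1:
//
//   std::vector<int64_t> x_dims = {3, 4};
//   auto rd = get_reduce_dims(dx, /*dout_ndim=*/4, /*x_ndim=*/2, &x_dims);
//   // rd == [0, 1]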

// TODO(cxxly): Check for overflow and throw InvalidCastException.
template <typename SRC_T, typename DST_T>
static std::vector<DST_T> unsafe_vector_cast(const std::vector<SRC_T>& src) {
  std::vector<DST_T> dst(src.begin(), src.end());
  return dst;
}
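
// Editor's note (illustration): the cast is element-wise and unchecked,
// e.g. narrowing int64_t shape values to int:
//
//   std::vector<int> v = unsafe_vector_cast<int64_t, int>({1, 2, 3});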

// This function computes the unsqueeze dims for a reshape that replaces
// unsqueeze.
static std::vector<int64_t> get_unsqueeze_dims(
    const Tensor& origin, const std::vector<int64_t>& axis) {
  auto origin_dims = origin.shape();
  auto total_shape_size = origin_dims.size() + axis.size();
  std::vector<int64_t> result;
  size_t j = 0, k = 0;
  for (size_t i = 0; i < total_shape_size; ++i) {
    if (j < axis.size() && axis[j] == int64_t(i)) {
      result.push_back(1);
      j++;
    } else {
      PADDLE_ENFORCE_LT(
          k,
          origin_dims.size(),
          platform::errors::OutOfRange("Your index [%lu] exceeds the number of "
                                       "elements in origin_dims[%lu].",
                                       k,
                                       origin_dims.size()));
      result.push_back(origin_dims[k]);
      k++;
    }
  }
  return result;
}
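
// Editor's note (illustration, assuming a Tensor `origin` of shape
// [3, 4]): inserting size-1 axes at positions 0 and 2 yields the reshape
// target that emulates unsqueeze:
//
//   auto dims = get_unsqueeze_dims(origin, {0, 2});
//   // dims == [1, 3, 1, 4]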

} // namespace experimental
} // namespace backend
} // namespace primitive
} // namespace paddle
2 changes: 2 additions & 0 deletions paddle/primitive/backend/eager_backend.cc
@@ -19,6 +19,7 @@

namespace paddle {
namespace primitive {
namespace backend {
namespace experimental {

template <>
@@ -58,5 +59,6 @@ Tensor tanh<Tensor>(const Tensor& x) {
  return ::tanh_ad_func(x);
}
} // namespace experimental
} // namespace backend
} // namespace primitive
} // namespace paddle
6 changes: 6 additions & 0 deletions paddle/primitive/backend/static_backend.cc
@@ -39,8 +39,13 @@

namespace paddle {
namespace primitive {
namespace backend {
namespace experimental {

using DescTensor = paddle::primitive::experimental::DescTensor;
using StaticCompositeContext =
    paddle::primitive::experimental::StaticCompositeContext;

template <>
Tensor empty<DescTensor>(const paddle::experimental::IntArray& shape,
                         phi::DataType dtype,
@@ -101,5 +106,6 @@ Tensor tanh<DescTensor>(const Tensor& x) {
}

} // namespace experimental
} // namespace backend
} // namespace primitive
} // namespace paddle
130 changes: 3 additions & 127 deletions paddle/primitive/primitive/primitive.h
@@ -14,140 +14,16 @@

#pragma once

#include <string>
#include <vector>

#include "paddle/fluid/framework/op_proto_maker.h"
#include "paddle/fluid/operators/common_infer_shape_functions.h"
#include "paddle/fluid/prim/api/generated_prim/prim_generated_api.h"
#include "paddle/phi/common/data_type.h"
#include "paddle/phi/common/int_array.h"
#include "paddle/phi/common/place.h"
#include "paddle/phi/common/scalar.h"
#include "paddle/phi/core/ddim.h"
#include "paddle/phi/kernels/funcs/blas/blas.h"
#include "paddle/utils/optional.h"

#include "paddle/primitive/backend/backend.h"
namespace paddle {
namespace primitive {
namespace experimental {

using Tensor = paddle::Tensor;

template <typename T>
Tensor tanh(const Tensor& x);

template <typename T>
Tensor empty(const paddle::experimental::IntArray& shape,
             phi::DataType dtype,
             const paddle::Place& place);

template <typename T>
Tensor empty_like(const Tensor& x,
                  phi::DataType dtype,
                  const paddle::Place& place);

// Copy a tensor to the output pointer; in static mode this requires an assign op.
template <typename T>
void by_pass(const Tensor& x, Tensor* out);

// Set the output pointer's impl from the temporary's impl; in dygraph mode, OutGradMeta should also be set.
template <typename T>
void set_output(const Tensor& x_tmp, Tensor* x);

// These helpers are shared by both backends and don't need to be specialized.
static phi::DDim get_reduce_dims_from_out(const phi::DDim& dout_dims,
                                          const phi::DDim& in_dims) {
  std::vector<int64_t> result;
  int bat = dout_dims.size() - in_dims.size();
  for (int i = 0; i < bat; ++i) {
    result.push_back(i);
  }
  for (int i = 0; i < in_dims.size(); ++i) {
    if (in_dims[i] == 1) {
      result.push_back(i + bat);
    } else {
      PADDLE_ENFORCE_EQ(
          in_dims[i],
          dout_dims[i + bat],
          platform::errors::InvalidArgument(
              "ReduceDims dimension mismatch. Operands could "
              "not be broadcast together with the shape of dout = [%s] and "
              "the shape of in_dims = [%s]. Received [%d] in X is not equal to "
              "[%d] in Y at i:%d.",
              dout_dims,
              in_dims,
              dout_dims[i + bat],
              in_dims[i],
              i));
    }
  }
  return phi::make_ddim(result);
}

static phi::DDim get_reduce_dims(const phi::DDim& x_dims,
                                 const phi::DDim& y_dims) {
  auto out_dims = paddle::operators::details::BroadcastTwoDims(x_dims, y_dims);
  return get_reduce_dims_from_out(out_dims, x_dims);
}

static std::vector<int> get_reduce_dims(const Tensor& dx,
                                        const int& dout_ndim,
                                        const int& x_ndim,
                                        std::vector<int64_t>* x_dims) {
  // This branch handles broadcasting with a 1-D operand: the 1-D tensor is
  // promoted to 2-D, which makes ddout_ndim > dout_ndim, but ddout_ndim is
  // only used when grad_out_grad != nullptr.
  if (dout_ndim < x_ndim) {
    return std::vector<int>({});
  }
  const std::vector<std::int64_t> dx_dims = phi::vectorize(dx.dims());
  std::vector<std::int64_t> broadcast_dims(dout_ndim);
  std::fill(
      broadcast_dims.data(), broadcast_dims.data() + dout_ndim - x_ndim, 1);
  std::copy(x_dims->data(),
            x_dims->data() + x_ndim,
            broadcast_dims.data() + dout_ndim - x_ndim);
  std::vector<int> reduce_dims;
  for (int i = 0; i <= dout_ndim - 3; i++) {
    if (dx_dims[i] != 1 && broadcast_dims[i] == 1) {
      reduce_dims.push_back(i);
    }
  }
  return reduce_dims;
}

// TODO(cxxly): Check for overflow and throw InvalidCastException.
template <typename SRC_T, typename DST_T>
static std::vector<DST_T> unsafe_vector_cast(const std::vector<SRC_T>& src) {
  std::vector<DST_T> dst(src.begin(), src.end());
  return dst;
}

// This function computes the unsqueeze dims for a reshape that replaces
// unsqueeze.
static std::vector<int64_t> get_unsqueeze_dims(
    const Tensor& origin, const std::vector<int64_t>& axis) {
  auto origin_dims = origin.shape();
  auto total_shape_size = origin_dims.size() + axis.size();
  std::vector<int64_t> result;
  size_t j = 0, k = 0;
  for (size_t i = 0; i < total_shape_size; ++i) {
    if (j < axis.size() && axis[j] == int64_t(i)) {
      result.push_back(1);
      j++;
    } else {
      PADDLE_ENFORCE_LT(
          k,
          origin_dims.size(),
          platform::errors::OutOfRange("Your index [%lu] exceeds the number of "
                                       "elements in origin_dims[%lu].",
                                       k,
                                       origin_dims.size()));
      result.push_back(origin_dims[k]);
      k++;
    }
  }
  return result;
}

template <typename T>
Tensor tanh(const Tensor& x) {
  return backend::experimental::tanh<T>(x);
}

} // namespace experimental
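
With the forwarding wrapper in place, call sites select a backend purely through the template argument. A hedged usage sketch (the surrounding setup, and an in-scope Tensor x, are assumed rather than shown in this commit):

    // Eager (dygraph): executes immediately via ::tanh_ad_func.
    Tensor y = paddle::primitive::experimental::tanh<paddle::Tensor>(x);

    // Static: records the op into the current program via DescTensor.
    using paddle::primitive::experimental::DescTensor;
    Tensor y2 = paddle::primitive::experimental::tanh<DescTensor>(x);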
