add cumprod_grad composite #64432

Merged: 11 commits, May 24, 2024

Changes from 2 commits

1 change: 1 addition & 0 deletions paddle/fluid/prim/api/api.yaml
@@ -29,6 +29,7 @@
- maximum
- minimum
- prod
- cumprod
- roll
- scatter
- scatter_nd_add
Contributor:

The implementation here seems to differ a bit from the one in details.h. Can you double-check?

Contributor Author:

Done

@@ -1071,6 +1071,31 @@ void gather_nd_grad(const Tensor& x,
}
}

template <typename T>
void cumprod_grad(const Tensor& x,
const Tensor& out,
const Tensor& out_grad,
int dim,
bool exclusive,
bool reverse,
Tensor* x_grad) {
if (x_grad) {
// dx = cumsum(out * out_grad, dim, false, exclusive, !reverse) / x
std::vector<int64_t> x_dim = common::vectorize<int64_t>(x.dims());
auto zero_tensor = full<T>(x_dim, 0.0, x.dtype());
auto zero_mask = cast<T>(equal<T>(x, zero_tensor), x.dtype());
auto common_dx =
cumsum<T>(out * out_grad, dim, false, exclusive, !reverse) / x;
auto ones_tensor = full<T>(x_dim, 1.0, x.dtype());
auto replace_one = (1 - zero_mask) * x + zero_mask * ones_tensor;
Contributor:

1. In the addition, can the second term zero_mask * ones_tensor be simplified to just zero_mask? Multiplying a tensor by the all-ones tensor ones_tensor is the same as not multiplying at all.
2. If that holds, ones_tensor can be deleted.

Contributor Author:

Done

auto cumprod_recompute = cumprod<T>(replace_one, dim, exclusive, reverse);
auto zeros_dx = cumsum<T>(
cumprod_recompute * out_grad, dim, false, exclusive, !reverse);
auto x_grad_res = (1 - zero_mask) * common_dx + zero_mask * zeros_dx;
set_output<T>(x_grad_res, x_grad);
}
}

template <typename T>
void prod_grad(const Tensor& x,
const Tensor& out,
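For reference, here is a minimal NumPy sketch of the same gradient rule for the exclusive=False, reverse=False case. It illustrates the composite rule above and is not the Paddle implementation itself; the only deliberate difference is that the common branch divides by replace_one rather than x, so zero entries do not produce NaN before they are masked out.

import numpy as np

def cumprod_grad_ref(x, out_grad, dim):
    # dx = reverse_cumsum(out * out_grad) / x, with zero entries handled by
    # recomputing cumprod with the zeros replaced by 1.
    out = np.cumprod(x, axis=dim)

    def rev_cumsum(t):
        # cumsum with reverse=True: sums over positions i >= k along dim
        return np.flip(np.cumsum(np.flip(t, axis=dim), axis=dim), axis=dim)

    zero_mask = (x == 0).astype(x.dtype)
    # fill the positions of 0 with 1
    replace_one = (1 - zero_mask) * x + zero_mask
    common_dx = rev_cumsum(out * out_grad) / replace_one
    zeros_dx = rev_cumsum(np.cumprod(replace_one, axis=dim) * out_grad)
    return (1 - zero_mask) * common_dx + zero_mask * zeros_dx

# quick check with a zero in the input
x = np.array([2.0, 0.0, 3.0, 4.0])
print(cumprod_grad_ref(x, np.ones_like(x), dim=0))  # expected [1, 32, 0, 0]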
25 changes: 25 additions & 0 deletions paddle/fluid/primitive/rule/vjp/details.h
@@ -59,6 +59,31 @@ void cumsum_grad(const Tensor& x,
}
}

template <typename T>
void cumprod_grad(const Tensor& x,
const Tensor& out,
const Tensor& out_grad,
int dim,
bool exclusive,
bool reverse,
Tensor* x_grad) {
if (x_grad) {
// dx = cumsum(out * out_grad, dim, false, exclusive, !reverse) / x
std::vector<int64_t> x_dim = common::vectorize<int64_t>(x.dims());
auto zero_tensor = full<T>(x_dim, 0.0, x.dtype());
auto zero_mask = cast<T>(equal<T>(x, zero_tensor), x.dtype());
auto common_dx =
cumsum<T>(out * out_grad, dim, false, exclusive, !reverse) / x;
auto ones_tensor = full<T>(x_dim, 1.0, x.dtype());
auto replace_one = (1 - zero_mask) * x + zero_mask * ones_tensor;
Contributor:

The ones_tensor here should be removable, right?

Contributor:

Suggested change:
-    auto ones_tensor = full<T>(x_dim, 1.0, x.dtype());
-    auto replace_one = (1 - zero_mask) * x + zero_mask * ones_tensor;
+    auto replace_one = (1 - zero_mask) * x + zero_mask;

Contributor:

Consider adding comments between logically consecutive blocks of code. For example, this step fills the positions of 0 with 1, so you could add: # fill the positions of 0 with 1.

Contributor Author:

Done

auto cumprod_recompute = cumprod<T>(replace_one, dim, exclusive, reverse);
auto zeros_dx = cumsum<T>(
cumprod_recompute * out_grad, dim, false, exclusive, !reverse);
auto x_grad_res = (1 - zero_mask) * common_dx + zero_mask * zeros_dx;
set_output<T>(x_grad_res, x_grad);
}
}

template <typename T>
void divide_grad(const Tensor& x,
const Tensor& y,
1 change: 1 addition & 0 deletions paddle/phi/api/yaml/backward.yaml
@@ -572,6 +572,7 @@
param: [x]
kernel :
func : cumprod_grad
composite: cumprod_grad(x, out, out_grad, dim, exclusive, reverse, x_grad)

- backward_op : cumsum_grad
forward : cumsum(Tensor x, Scalar axis=-1, bool flatten=false, bool exclusive=false, bool reverse=false) -> Tensor(out)
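Once the composite rule is registered, enabling prim backward makes the gradient of paddle.cumprod go through the decomposed rule instead of the cumprod_grad kernel. A minimal eager-mode sketch, mirroring the tests below:

import paddle
from paddle.base import core

# Turn on composite (prim) backward in dynamic graph mode; the cumprod VJP is
# then built from primitive ops (cumsum, cumprod, full, ...) rather than
# dispatched to the cumprod_grad kernel.
core.set_prim_eager_enabled(True)

x = paddle.to_tensor([1.0, 2.0, 0.0, 4.0], stop_gradient=False)
y = paddle.cumprod(x, dim=0)
(dx,) = paddle.grad(y, x)
print(dx)  # should match the gradient computed with prim disabled

core.set_prim_eager_enabled(False)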
76 changes: 76 additions & 0 deletions test/prim/prim/vjp/eager/test_comp_eager_cumprod_grad.py
@@ -0,0 +1,76 @@
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import unittest

import numpy as np
import parameterized as param

import paddle
from paddle.base import core


@param.parameterized_class(
('primal', 'dtype'),
[
Contributor:

Add a single-element test case: np.array(np.rand(), dtype="float32")

Contributor Author:

Done

(
np.random.rand(2, 3, 4),
np.float32,
),
(
np.random.rand(2, 3, 3, 4),
np.float32,
),
],
)
Contributor:

1. Shapes: add 0-D, 1-D, 2-D, and 5-D cases.
2. Dtypes: add int64.
3. Data: add cases containing a single 0, two 0s, and all zeros.

Contributor Author:

Done

class TestCumprodGradComp(unittest.TestCase):
@classmethod
def setUpClass(cls):
cls.primal = cls.primal.astype(cls.dtype)

def test_cumprod_grad_comp(self):
def actual(primal, dim):
paddle.disable_static()
core.set_prim_eager_enabled(True)
x = paddle.to_tensor(primal, dtype='float32', stop_gradient=False)
x.stop_gradient = False
y = paddle.cumprod(x, dim=dim)
x_cotangent = paddle.grad(
y, x, create_graph=True, retain_graph=True
)
return x_cotangent[0]

def desired(primal, dim):
paddle.disable_static()
core.set_prim_eager_enabled(False)
x = paddle.to_tensor(primal, dtype='float32', stop_gradient=False)
x.stop_gradient = False
y = paddle.cumprod(x, dim=dim)
x_cotangent = paddle.grad(
y, x, create_graph=False, retain_graph=True
)
return x_cotangent[0]

for i in range(len(self.primal.shape)):
np.testing.assert_allclose(
actual=actual(self.primal, i),
desired=desired(self.primal, i),
rtol=1e-6,
atol=0,
)
core.set_prim_eager_enabled(False)


if __name__ == '__main__':
unittest.main()
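A hypothetical extension of the parameterized cases along the lines the reviewers asked for (0-D, 1-D and 5-D shapes, int64 dtype, inputs containing zeros). The cases actually added in later commits of this PR may differ, and the 0-D and int64 entries would also need small tweaks to the test body (the per-dimension loop and the hard-coded float32 dtype):

import numpy as np

# hypothetical extra parameterized cases, not the ones merged in this PR
extra_cases = [
    (np.array(np.random.rand()), np.float32),                                  # 0-D
    (np.random.rand(5), np.float32),                                           # 1-D
    (np.random.rand(2, 1, 3, 1, 2), np.float32),                               # 5-D
    (np.random.randint(1, 5, size=(2, 3, 4)), np.int64),                       # int64 data
    (np.random.rand(2, 3, 4) * (np.random.rand(2, 3, 4) > 0.2), np.float32),   # contains zeros
]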
123 changes: 123 additions & 0 deletions test/prim/prim/vjp/static/test_comp_cumprod_grad.py
Contributor:

Add more unit-test cases, same as in test/prim/prim/vjp/eager/test_comp_eager_cumprod_grad.py.

Contributor Author:

Done

@@ -0,0 +1,123 @@
# Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import unittest

from paddle.base import core

core._set_prim_backward_enabled(True)

import numpy as np
import parameterized as param

import paddle


def apply_to_static(net, use_cinn):
build_strategy = paddle.static.BuildStrategy()
build_strategy.build_cinn_pass = use_cinn
return paddle.jit.to_static(
net, build_strategy=build_strategy, full_graph=True
)


class PrimeNet(paddle.nn.Layer):
def __init__(self):
super().__init__()
self.fc = paddle.nn.Linear(4, 4)

def forward(self, x):
tmp = self.fc(x)
out = paddle.cumprod(tmp, -1)
return out


@param.parameterized_class(
Contributor (@HydrogenSulfate, May 21, 2024):

Same as above: add a single-element 0-D case.

Contributor Author:

Done

('primal', 'cotangent', 'dtype'),
[
(np.random.rand(10, 10), np.random.rand(10, 10), np.float32),
],
)
class TestCumprodGradComp(unittest.TestCase):
@classmethod
def setUpClass(cls):
cls.primal = cls.primal.astype(cls.dtype)
cls.cotangent = cls.cotangent.astype(cls.dtype)

def train(self, use_prim, use_cinn):
paddle.seed(2022)
self.x = paddle.randn([2, 4])
self.x.stop_gradient = False
net = PrimeNet()
core._set_prim_backward_enabled(use_prim)
net = apply_to_static(net, use_cinn)
out = net(self.x)
res = paddle.autograd.grad(out, [self.x])

return res

def test_tanh_grad_comp(self):
paddle.enable_static()

def actual(primal, cotangent, dim):
core._set_prim_backward_enabled(True)
mp, sp = paddle.static.Program(), paddle.static.Program()
with paddle.static.program_guard(mp, sp):
x = paddle.static.data('primal', primal.shape, primal.dtype)
x.stop_gradient = False
v = paddle.static.data(
'cotangent', cotangent.shape, cotangent.dtype
)
y = paddle.cumprod(x, dim)
x_cotangent = paddle.static.gradients(y, x, v)
exe = paddle.static.Executor()
exe.run(sp)
return exe.run(
program=mp,
feed={'primal': primal, 'cotangent': cotangent},
fetch_list=[x_cotangent[0]],
)[0]

def desired(primal, cotangent, dim):
core._set_prim_backward_enabled(False)
mp, sp = paddle.static.Program(), paddle.static.Program()
with paddle.static.program_guard(mp, sp):
x = paddle.static.data('primal', primal.shape, primal.dtype)
x.stop_gradient = False
v = paddle.static.data(
'cotangent', cotangent.shape, cotangent.dtype
)
y = paddle.cumprod(x, dim)
x_cotangent = paddle.static.gradients(y, x, v)
exe = paddle.static.Executor()
exe.run(sp)
return exe.run(
program=mp,
feed={'primal': primal, 'cotangent': cotangent},
fetch_list=[x_cotangent[0]],
)[0]

for i in range(len(self.primal.shape)):
np.testing.assert_allclose(
actual=actual(self.primal, self.cotangent, i),
desired=desired(self.primal, self.cotangent, i),
rtol=1e-6,
atol=0,
)
core._set_prim_backward_enabled(False)
paddle.disable_static()


if __name__ == '__main__':
unittest.main()