Commit

Merge branch 'main' into howto_docs
felipeangelimvieira committed Dec 15, 2024
2 parents 540c1b1 + a4aa653 commit 2ccc4b2
Showing 6 changed files with 93 additions and 65 deletions.
File renamed without changes.
4 changes: 4 additions & 0 deletions docs/reference/optimizers.md
@@ -0,0 +1,4 @@
# MAP Optimizers and solvers

::: prophetverse.engine.optimizer

4 changes: 4 additions & 0 deletions docs/reference/trends.md
@@ -0,0 +1,4 @@
# Trend models

::: prophetverse.effects.trend

17 changes: 11 additions & 6 deletions docs/the-theory.md
@@ -44,11 +44,12 @@ y_{mean} &= \sum\limits_{i=1}^n f_i(x_i(t), \{f_j(x_j)\}_{j<i}) \\
&= f_1(x_1(t)) + f_2(x_2(t), f_1(x_1(t))) + \ldots + f_n(t, \{f_j(x_j)\}_{j<n})
\end{align}

where

* the first component $f_1$ accounts for the trend
* the second component $f_2$ is another regression component that could interact with the trend $f_1$
* the third component $f_3$ is another regression component that could interact with $f_1$ and $f_2$
* each subsequent component can interact with the previously defined components (see the example below).
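
For instance, a multiplicative seasonal effect is one such interaction: it takes the trend as an additional input and rescales it,

$$
f_2(x_2(t), f_1(x_1(t))) = f_1(x_1(t)) \cdot s(x_2(t)),
$$

where $s$ is a seasonal function of the features $x_2(t)$. This is only an illustrative special case of the composition above, not the only possible form.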


This definition supersedes the
@@ -70,7 +71,7 @@ likelihood, $\phi$ is the identity function, but for Gamma and Negative Binomial

$$
\phi(k) = \begin{cases}
k & \text{if } k > z \\
z\exp(k-z) & \text{if } k \leq z
\end{cases}
$$
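
The cases above leave the predictor unchanged above the threshold $z$ and map it to a strictly positive exponential branch below it, with both branches meeting at the value $z$. A minimal sketch of this transform, assuming JAX and with the threshold passed explicitly (the value used here is only illustrative), could look like:

```python
import jax.numpy as jnp


def positive_link(k, z):
    """Map a real-valued predictor k to a strictly positive value.

    Identity for k > z; z * exp(k - z) for k <= z, so both branches meet
    continuously at k = z with value z.
    """
    # Clamp the exponent so the branch discarded by `where` cannot overflow.
    return jnp.where(k > z, k, z * jnp.exp(jnp.minimum(k, z) - z))


# Values below the threshold are mapped smoothly into (0, z].
print(positive_link(jnp.array([-2.0, 0.0, 0.5, 3.0]), z=1.0))
```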
@@ -199,6 +200,10 @@
Here, `P` is the period (e.g., 365.25 for yearly seasonality), and $a_k$ and $b_k$ are the Fourier coefficients that the model estimates. The choice of `K` depends on the granularity of the seasonal changes one wishes to capture.
A Normal prior is placed on the coefficients, $a_k, b_k \sim \mathcal{N}(0, \sigma_s)$, where $\sigma_s$ is a hyperparameter.

See [`LinearFourierSeasonality`](/reference/effects/#prophetverse.effects.LinearFourierSeasonality) for more details on the hyperparameters of this effect.
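
As a minimal illustration of the construction above (the helper `fourier_features` below is ours, not part of the library's API), the matrix of Fourier terms can be built as:

```python
import numpy as np


def fourier_features(t: np.ndarray, period: float, K: int) -> np.ndarray:
    """Return the 2K columns sin(2*pi*k*t/P) and cos(2*pi*k*t/P) for k = 1..K."""
    angles = 2.0 * np.pi * np.outer(t, np.arange(1, K + 1)) / period
    return np.concatenate([np.sin(angles), np.cos(angles)], axis=1)


# Two years of daily data, yearly seasonality (P = 365.25), K = 10 harmonics:
# the model learns one coefficient a_k or b_k per resulting column.
X_seasonal = fourier_features(np.arange(730), period=365.25, K=10)
print(X_seasonal.shape)  # (730, 20)
```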




### Matrix Formulation of Fourier Series

7 changes: 4 additions & 3 deletions mkdocs.yml
@@ -49,7 +49,7 @@ nav:

#- Marketing Mix Modeling 🚀:
# - Lift test calibration: examples/custom-effect.ipynb
- Understand Prophetverse:
- Mathematical formulation 📖:
- Theory: the-theory.md

- Reference:
@@ -59,9 +59,10 @@
- ProphetGamma: reference/sktime/prophet_gamma.md
- ProphetNegBinomial: reference/sktime/prophet_negbin.md
- Hierarchical Prophet: reference/sktime/hierarchical_prophet.md
- Core:
- Inference Engine: reference/core/inference_engine.md
- Inference Engines: reference/inference_engine.md
- Optimizers: reference/optimizers.md
- Exogenous Effects: reference/effects.md
- Trend models: reference/trends.md
- Development:
- Contributing to Prophetverse: development/development-guide.md
- Deprecation Policy: deprecation.md
126 changes: 70 additions & 56 deletions src/prophetverse/engine/optimizer/optimizer.py
@@ -20,6 +20,7 @@
"BaseOptimizer",
"AdamOptimizer",
"CosineScheduleAdamOptimizer",
"LBFGSSolver",
]


@@ -64,17 +65,15 @@ class AdamOptimizer(BaseOptimizer):
Adam optimizer for NumPyro models.
This class implements the Adam optimization algorithm.
Parameters
----------
step_size : float, optional
The step size (learning rate) for the optimizer. Default is 0.001.
"""

def __init__(self, step_size=0.001):
"""
Initialize the AdamOptimizer.
Parameters
----------
step_size : float, optional
The step size (learning rate) for the optimizer. Default is 0.001.
"""
"""Initialize the AdamOptimizer."""
self.step_size = step_size
super().__init__()

@@ -96,23 +95,20 @@ class CosineScheduleAdamOptimizer(BaseOptimizer):
This optimizer combines the Adam optimizer with a cosine decay schedule
for the learning rate.
Parameters
----------
init_value : float, optional
Initial learning rate. Default is 0.001.
decay_steps : int, optional
Number of steps over which the learning rate decays. Default is 100_000.
alpha : float, optional
Final multiplier for the learning rate. Default is 0.0.
exponent : int, optional
Exponent for the cosine decay schedule. Default is 1.
"""

def __init__(self, init_value=0.001, decay_steps=100_000, alpha=0.0, exponent=1):
"""
Initialize the CosineScheduleAdamOptimizer.
Parameters
----------
init_value : float, optional
Initial learning rate. Default is 0.001.
decay_steps : int, optional
Number of steps over which the learning rate decays. Default is 100_000.
alpha : float, optional
Final multiplier for the learning rate. Default is 0.0.
exponent : int, optional
Exponent for the cosine decay schedule. Default is 1.
"""
self.init_value = init_value
self.decay_steps = decay_steps
self.alpha = alpha
@@ -145,30 +141,49 @@ def create_optimizer(self) -> _NumPyroOptim:
return opt


class BFGSOptimizer(BaseOptimizer):

def __init__(self, learning_rate=1e-3, memory_size=10, scale_init_precond=True):

self.learning_rate = learning_rate
self.memory_size = memory_size
self.scale_init_precond = scale_init_precond
super().__init__()

def create_optimizer(self):

# Linesearch
linesearch = optax.scale_by_lbfgs(
memory_size=self.memory_size,
scale_init_precond=self.scale_init_precond,
)

# Optimizer
opt = optax.chain(linesearch, optax.scale(-1.0))

return numpyro.optim.optax_to_numpyro(opt)


class LBFGSSolver(BaseOptimizer):
"""
L-BFGS solver.
This solver is often more practical than the other optimizers because it
usually requires no hyperparameter tuning to obtain good estimates.
If your model does not converge with the default hyperparameters, try
increasing `memory_size`, `max_linesearch_steps`, or the number of steps.
Parameters
----------
gtol : float, default=1e-6
Gradient tolerance for stopping criterion.
tol : float, default=1e-6
Function value tolerance for stopping criterion.
learning_rate : float, default=1e-3
Initial learning rate.
memory_size : int, default=10
Memory size for L-BFGS updates.
scale_init_precond : bool, default=True
Whether to scale the initial preconditioner.
max_linesearch_steps : int, default=20
Maximum number of line search steps.
initial_guess_strategy : str, default="one"
Strategy for the initial line search step size guess.
max_learning_rate : float, optional
Maximum allowed learning rate during line search.
linesearch_tol : float, default=0
Tolerance parameter for line search.
increase_factor : float, default=2
Factor by which to increase step size during line search when conditions are
met.
slope_rtol : float, default=0.0001
Relative tolerance for slope in the line search.
curv_rtol : float, default=0.9
Curvature condition tolerance for line search.
approx_dec_rtol : float, default=0.000001
Approximate decrease tolerance for line search.
stepsize_precision : float, default=1e5
Stepsize precision tolerance.
"""

_tags = {
"is_solver": True,
@@ -214,12 +229,13 @@ def __init__(
self.max_iter = 1000

def set_max_iter(self, max_iter: int):

"""Set the maximum number of iterations for the solver."""
new_obj = self.clone()
new_obj.max_iter = max_iter
return new_obj

def create_optimizer(self):
"""Create and return a NumPyro L-BFGS solver instance."""
return LBFGS(
max_iter=self.max_iter,
tol=self.tol,
@@ -245,21 +261,19 @@ class _LegacyNumpyroOptimizer(BaseOptimizer):
Legacy optimizer.
This class allows the use of any optimizer available in numpyro.optim by name.
Parameters
----------
optimizer_name : str, optional
The name of the optimizer to use from numpyro.optim. Default is "Adam".
optimizer_kwargs : dict, optional
Keyword arguments to pass to the optimizer. Default is None.
"""

def __init__(
self, optimizer_name: str = "Adam", optimizer_kwargs: Optional[dict] = None
):
"""
Initialize the _LegacyNumpyroOptimizer.
Parameters
----------
optimizer_name : str, optional
The name of the optimizer to use from numpyro.optim. Default is "Adam".
optimizer_kwargs : dict, optional
Keyword arguments to pass to the optimizer. Default is None.
"""
"""Initialize the _LegacyNumpyroOptimizer."""
self.optimizer_name = optimizer_name
self.optimizer_kwargs = optimizer_kwargs
super().__init__()
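
As a usage sketch of the new solver (assuming `LBFGSSolver` is importable from `prophetverse.engine.optimizer`, as the new reference page suggests, and that the constructor accepts the keyword arguments documented in its docstring):

```python
from prophetverse.engine.optimizer import LBFGSSolver

# Defaults usually work; increase memory_size / max_linesearch_steps only if
# the model does not converge, as the docstring recommends.
solver = LBFGSSolver(memory_size=20, max_linesearch_steps=40)

# set_max_iter returns a modified clone rather than mutating the instance.
solver = solver.set_max_iter(2000)

# create_optimizer builds the underlying NumPyro L-BFGS solver.
lbfgs_optim = solver.create_optimizer()
```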
