exoplanet-dev · dfm · Sep 16, 2020 · Sep 16, 2020 · Oct 14, 2020 · Oct 14, 2020
diff --git a/.github/workflows/python.yml b/.github/workflows/python.yml
@@ -79,6 +79,19 @@ jobs:
           conda install -q numpy scipy theano mkl-service
           python -m pip install -U pip
           python -m pip install --use-feature=2020-resolver -e ".[test,theano]"
+      - name: Get theano compiledir
+        id: compiledir
+        shell: bash -l {0}
+        run: |
+          python -c "import theano; print('::set-output name=compiledir::' + theano.config.compiledir.split('/')[-1])"
+      - name: "Cache ~/.theano"
+        uses: actions/cache@v2
+        with:
+          path: ~/.theano
+          key: theano-${{ steps.compiledir.outputs.compiledir }}-${{ hashFiles('python/test/theano/*.py') }}
+          restore-keys: |
+            theano-${{ steps.compiledir.outputs.compiledir }}-
+            theano-
       - name: Run the unit tests
         shell: bash -l {0}
         run: python -m pytest --cov celerite2 python/test/theano

diff --git a/.github/workflows/tutorials.yml b/.github/workflows/tutorials.yml
@@ -29,6 +29,20 @@ jobs:
           python -m pip install -U pip
           python -m pip install --use-feature=2020-resolver ".[tutorials]"
 
+      - name: Get theano compiledir
+        id: compiledir
+        run: |
+          python -c "import theano; print('::set-output name=compiledir::' + theano.config.compiledir.split('/')[-1])"
+
+      - name: "Cache ~/.theano"
+        uses: actions/cache@v2
+        with:
+          path: ~/.theano
+          key: tutorials-${{ steps.compiledir.outputs.compiledir }}-${{ hashFiles('docs/tutorials/*.py') }}
+          restore-keys: |
+            tutorials-${{ steps.compiledir.outputs.compiledir }}-
+            tutorials-
+
       - name: Execute the notebooks
         run: |
           jupytext --to ipynb --execute docs/tutorials/*.py

diff --git a/docs/.gitignore b/docs/.gitignore
@@ -1,2 +1,3 @@
 _build
 c++
+tutorials/*.png
diff --git a/docs/api/python.rst b/docs/api/python.rst
@@ -72,3 +72,15 @@ recommended unless you're confident that you know what you're doing.
 .. autoclass:: celerite2.terms.RealTerm
 .. autoclass:: celerite2.terms.ComplexTerm
 .. autoclass:: celerite2.terms.OriginalCeleriteTerm
+
+Multivariate models
+-------------------
+
+The original *celerite* algorithm was only defined for one-dimensional inputs,
+but this was generalized by `Gordon et al. (2020)
+<https://arxiv.org/abs/2007.05799>`_ to support multivariate inputs on tensor
+product grids with separable kernels. In this case, the covariance matrix is
+given by a Kronecker product. These models are now available in *celerite2*
+using the following:
+
+.. autoclass:: celerite2.kron.KronTerm
diff --git a/docs/index.rst b/docs/index.rst
@@ -36,6 +36,7 @@ be a good choice.
    :caption: Tutorials
 
    tutorials/first.ipynb
+   tutorials/kron.ipynb
 
 .. toctree::
    :maxdepth: 2

diff --git a/docs/tutorials/first.py b/docs/tutorials/first.py
@@ -36,7 +36,10 @@
 np.random.seed(42)
 
 t = np.sort(
-    np.append(np.random.uniform(0, 3.8, 57), np.random.uniform(5.5, 10, 68),)
+    np.append(
+        np.random.uniform(0, 3.8, 57),
+        np.random.uniform(5.5, 10, 68),
+    )
 )  # The input coordinates must be sorted
 yerr = np.random.uniform(0.08, 0.22, len(t))
 y = (

diff --git a/docs/tutorials/kron.py b/docs/tutorials/kron.py
@@ -0,0 +1,141 @@
+# -*- coding: utf-8 -*-
+# ---
+# jupyter:
+#   jupytext:
+#     text_representation:
+#       extension: .py
+#       format_name: light
+#       format_version: '1.5'
+#       jupytext_version: 1.5.2
+#   kernelspec:
+#     display_name: Python 3
+#     language: python
+#     name: python3
+# ---
+
+# + nbsphinx="hidden"
+# %matplotlib inline
+
+# + nbsphinx="hidden"
+# %run notebook_setup
+# -
+
+# # Multivariate models
+#
+# The original *celerite* package only supported one-dimensional data (like time series), but [Gordon et al. (2020)](https://arxiv.org/abs/2007.05799) generalized the method to multivariate data on a tensor product grid.
+# This has been implemented in *celerite2* so "rectangular" data are now supported.
+# The main application discussed by [Gordon et al. (2020)](https://arxiv.org/abs/2007.05799) was multiwavelength observations of transiting exoplanets, but this can be applicable to many other problems with the following structure:
+#
+# 1. The rectangular data must be fully filled: you must have observations in every band at every time. We've developed a method to handle missing data and that will be included in a future release.
+# 2. The covariance matrix must be separable with the form `k({x, y}_n, {x, y}_m) = k1(x_n, x_m) * k2(y_n, y_m)`, where `x` (a scalar) indexes the "longest" one-dimensional axis of the data (for example, time) and `y` (optionally a vector) indexes the narrower axis of the data (for example, wavelength). To apply *celerite*, we must make the further assumption that `k1(x_n, x_m)` is a standard *celerite* kernel, but no limitations are placed on the form of `k2(y_n, y_m)`.
+#
+# The implementation of this method in *celerite2* comes with two forms for the kernel:
+#
+# 1. `kron.KronTerm`: A general form of the model where `k2(y_n, y_m)` is specified as a full-rank `M x M` matrix called `R`, where `M` is the size of the `y` dimension. The computational cost of evaluating this model scales as `O(N * J^2 * M^3)` where `N` is the size of the `x` dimension and `J` is the rank of the *celerite* term describing `k1(x_n, x_m)`.
+# 2. `kron.LowRankKronTerm`: A more computationally efficient method where
+
+# +
+import numpy as np
+import matplotlib.pyplot as plt
+
+import celerite2
+
+N = 200
+M = 5
+lam = np.linspace(0, 3, M)
+
+np.random.seed(59302)
+t = np.append(
+    np.sort(np.random.uniform(0, 4, N // 2)),
+    np.sort(np.random.uniform(6, 10, N - N // 2)),
+)
+yerr = np.random.uniform(1e-1, 2e-1, (N, M))
+
+rho_true = 4.5
+R_true = 0.5 * np.exp(-0.5 * (lam[:, None] - lam[None, :]) ** 2)
+kernel = celerite2.kron.KronTerm(
+    celerite2.terms.SHOTerm(sigma=1.0, rho=rho_true, Q=3.0), R=R_true
+)
+gp = celerite2.GaussianProcess(kernel, t=t, yerr=yerr)
+y = gp.sample()
+
+plt.yticks([])
+for m in range(M):
+    plt.axhline(2 * m, color="k", lw=0.5)
+plt.plot(t, y + 2 * np.arange(M), ".")
+plt.ylim(-2, 2 * M)
+plt.xlim(-1, 11)
+plt.xlabel("x")
+_ = plt.ylabel("y (with offsets)")
+
+# +
+import pymc3 as pm
+import pymc3_ext as pmx
+import celerite2.theano as cl2
+
+with pm.Model() as model:
+
+    rho = pm.Lognormal("rho", mu=np.log(5.0), sigma=5.0)
+    chol = pm.LKJCholeskyCov(
+        "chol",
+        eta=10.0,
+        n=M,
+        sd_dist=pm.Exponential.dist(0.01),
+        compute_corr=True,
+    )[0]
+    R = pm.Deterministic("R", pm.math.dot(chol, chol.T))
+
+    kernel = cl2.kron.KronTerm(
+        cl2.terms.SHOTerm(sigma=1.0, rho=rho, Q=3.0), R=R
+    )
+    gp = cl2.GaussianProcess(kernel, t=t, yerr=yerr)
+    gp.marginal("obs", observed=y)
+
+    soln = pmx.optimize()
+
+# +
+t_pred = np.linspace(-1, 11, 1000)
+with model:
+    mu, var = pmx.eval_in_model(gp.predict(y, t=t_pred, return_var=True), soln)
+
+plt.yticks([])
+for m in range(M):
+    plt.axhline(2 * m, color="k", lw=0.5)
+    plt.plot(t, y[:, m] + 2 * m, ".", color=f"C{m}")
+    plt.fill_between(
+        t_pred,
+        mu[:, m] - np.sqrt(var[:, m]) + 2 * m,
+        mu[:, m] + np.sqrt(var[:, m]) + 2 * m,
+        color=f"C{m}",
+        alpha=0.5,
+    )
+    plt.plot(t_pred, mu[:, m] + 2 * m, color=f"C{m}")
+
+plt.ylim(-2, 2 * M)
+plt.xlim(-1, 11)
+plt.xlabel("x")
+_ = plt.ylabel("y (with offsets)")
+# -
+
+with model:
+    trace = pm.sample(
+        tune=2000, draws=2000, target_accept=0.9, init="adapt_full"
+    )
+
+plt.hist(trace["rho"], 50, histtype="step", color="k")
+plt.axvline(rho_true)
+plt.yticks([])
+plt.xlabel(r"$\rho$")
+plt.ylabel(r"$p(\rho)$")
+
+for m in range(M):
+    plt.errorbar(
+        np.arange(M),
+        np.mean(trace["R"][:, m, :], axis=0) + m,
+        yerr=np.std(trace["R"][:, m, :], axis=0),
+        color=f"C{m}",
+    )
+    plt.plot(np.arange(M), R_true[m] + m, ":", color=f"C{m}")
+plt.yticks([])
+plt.xlabel("band index")
+_ = plt.ylabel("covariance (with offsets)")
diff --git a/python/celerite2/__init__.py b/python/celerite2/__init__.py
@@ -1,8 +1,8 @@
 # -*- coding: utf-8 -*-
 
-__all__ = ["__version__", "terms", "GaussianProcess"]
+__all__ = ["__version__", "terms", "kron", "GaussianProcess"]
 
-from . import terms
+from . import kron, terms
 from .celerite2 import GaussianProcess
 from .celerite2_version import __version__