# Copyright 2022 - 2025 The PyMC Labs Developers
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Specialized priors that behave like the Prior class.

The Prior class has design constraints that prevent it from covering every
case, so this module collects priors that do not inherit from the Prior
class but expose many of the same methods.
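
For example, a minimal (illustrative) usage within a model context:

.. code-block:: python

    import pymc as pm

    from pymc_marketing.special_priors import LogNormalPositiveParam

    prior = LogNormalPositiveParam(mu=1.0, sigma=1.0)

    with pm.Model():
        variable = prior.create_variable("variable")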
| 21 | +""" |
| 22 | + |
| 23 | +import numpy as np |
| 24 | +import pymc as pm |
| 25 | +import pytensor.tensor as pt |
| 26 | +import xarray as xr |
| 27 | +from pymc_extras.deserialize import deserialize, register_deserialization |
| 28 | +from pymc_extras.prior import Prior, create_dim_handler, sample_prior |
| 29 | +from pytensor.tensor import TensorVariable |
| 30 | + |
| 31 | + |
| 32 | +class LogNormalPositiveParam: |
| 33 | + """ |
| 34 | + A specialized implementation of a log normal distribution. |
| 35 | +
|
| 36 | + Like the LogNormal distribution, this distribution has support over the positive numbers. |
| 37 | + However, unlike the lognormal, the parameters are also specified in the positive |
| 38 | + domain. |
| 39 | +
|
| 40 | + The other advantage of this prior is in constructing hierarchical models. It allows users to toggle |
| 41 | + between centered and non-centered parameterizations. This enables rapid iteration when searching |
| 42 | + for a parameterization that samples efficiently. |
| 43 | +
|
| 44 | + Parameters |
| 45 | + ---------- |
| 46 | + mu : Prior, float, int, array-like |
| 47 | + The mean of the distribution. |
| 48 | + sigma : Prior, float, int, array-like |
| 49 | + The standard deviation of the distribution. |
| 50 | + dims : tuple[str, ...], optional |
| 51 | + The dimensions of the distribution, by default None. |
| 52 | + centered : bool, optional |
| 53 | + Whether the distribution is centered, by default True. |
| 54 | +
|
| 55 | + Examples |
| 56 | + -------- |
| 57 | + Build a non-centered hierarchical model where information is shared across geos. |
| 58 | +
|
| 59 | + .. code-block:: python |
| 60 | + from pymc_marketing.special_priors import LogNormalPositiveParam |
| 61 | +
|
| 62 | + normal = LogNormalPositiveParam( |
| 63 | + mu=Prior("Gamma", mu=1.0, sigma=1.0), |
| 64 | + sigma=Prior("HalfNormal", sigma=1.0), |
| 65 | + dims=("geo",), |
| 66 | + centered=False, |
| 67 | + ) |
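
    Sample from the prior to inspect the implied distribution (the ``geo``
    coordinate values here are only illustrative):

    .. code-block:: python

        prior_samples = lognormal.sample_prior(coords={"geo": ["A", "B", "C"]})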
    """

    def __init__(self, dims: tuple | None = None, centered: bool = True, **parameters):
        self.parameters = parameters
        self.dims = dims
        self.centered = centered

        self._checks()

    def _checks(self) -> None:
        self._parameters_are_correct_set()

    def _parameters_are_correct_set(self) -> None:
        if set(self.parameters.keys()) != {"mu", "sigma"}:
            raise ValueError("Parameters must be mu and sigma")

    def _create_parameter(self, param, value, name):
        # Plain values (floats, arrays) pass through unchanged; anything with a
        # ``create_variable`` method is turned into a child variable first.
        if not hasattr(value, "create_variable"):
            return value

        child_name = f"{name}_{param}"
        return self.dim_handler(value.create_variable(child_name), value.dims)

    def create_variable(self, name: str) -> TensorVariable:
        """Create a variable from the prior distribution."""
        self.dim_handler = create_dim_handler(self.dims)
        parameters = {
            param: self._create_parameter(param, value, name)
            for param, value in self.parameters.items()
        }
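        # Moment matching (a standard identity, stated here for reference): if
        # X ~ LogNormal(mu_log, sigma_log), then E[X] = exp(mu_log + sigma_log**2 / 2)
        # and SD[X]**2 = (exp(sigma_log**2) - 1) * exp(2 * mu_log + sigma_log**2).
        # Solving for mu_log and sigma_log so that E[X] = mu and SD[X] = sigma
        # gives the expressions below.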
        mu_log = pt.log(
            parameters["mu"] ** 2
            / pt.sqrt(parameters["mu"] ** 2 + parameters["sigma"] ** 2)
        )
        sigma_log = pt.sqrt(
            pt.log(1 + (parameters["sigma"] ** 2 / parameters["mu"] ** 2))
        )
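
        # The centered form draws log(phi) directly; the non-centered form draws
        # a standard-normal offset and shifts/scales it, which can sample more
        # efficiently in hierarchical models when group-level values are only
        # weakly identified by the data.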
        if self.centered:
            log_phi = pm.Normal(
                f"{name}_log", mu=mu_log, sigma=sigma_log, dims=self.dims
            )

        else:
            log_phi_z = pm.Normal(
                f"{name}_log_offset", mu=0, sigma=1, dims=self.dims
            )
            log_phi = mu_log + log_phi_z * sigma_log

        phi = pm.math.exp(log_phi)
        phi = pm.Deterministic(name, phi, dims=self.dims)

        return phi

    def to_dict(self):
        """Convert the prior distribution to a dictionary.
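
        The resulting structure looks like the following sketch (exact values
        depend on the parameters; this example assumes a non-centered prior
        with ``dims=("geo",)``)::

            {
                "special_prior": "LogNormalPositiveParam",
                "kwargs": {"mu": ..., "sigma": ...},
                "centered": False,
                "dims": ("geo",),
            }
        """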
        data = {
            "special_prior": "LogNormalPositiveParam",
        }
        if self.parameters:

            def handle_value(value):
                if isinstance(value, Prior):
                    return value.to_dict()

                if isinstance(value, pt.TensorVariable):
                    value = value.eval()

                if isinstance(value, np.ndarray):
                    return value.tolist()

                if hasattr(value, "to_dict"):
                    return value.to_dict()

                return value

            data["kwargs"] = {
                param: handle_value(value) for param, value in self.parameters.items()
            }
        if not self.centered:
            data["centered"] = False

        if self.dims:
            data["dims"] = self.dims

        return data

    @classmethod
    def from_dict(cls, data) -> "LogNormalPositiveParam":
        """Create a LogNormalPositiveParam prior from a dictionary."""
        if not isinstance(data, dict):
            msg = (
                "Must be a dictionary representation of a prior distribution. "
                f"Not of type: {type(data)}"
            )
            raise ValueError(msg)

        kwargs = data.get("kwargs", {})

        def handle_value(value):
            if isinstance(value, dict):
                return deserialize(value)

            if isinstance(value, list):
                return np.array(value)

            return value

        kwargs = {param: handle_value(value) for param, value in kwargs.items()}
        centered = data.get("centered", True)
        dims = data.get("dims")
        if isinstance(dims, list):
            dims = tuple(dims)

        return cls(dims=dims, centered=centered, **kwargs)

    def sample_prior(
        self,
        coords=None,
        name: str = "variable",
        **sample_prior_predictive_kwargs,
    ) -> xr.Dataset:
        """Sample from the prior distribution."""
        return sample_prior(
            factory=self,
            coords=coords,
            name=name,
            **sample_prior_predictive_kwargs,
        )


def _is_lognormalpositiveparam_type(data: dict) -> bool:
    return data.get("special_prior") == "LogNormalPositiveParam"


register_deserialization(
    is_type=_is_lognormalpositiveparam_type,
    deserialize=LogNormalPositiveParam.from_dict,
)
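
# Illustrative round trip (``prior`` stands for any LogNormalPositiveParam
# instance): ``deserialize(prior.to_dict())`` rebuilds an equivalent prior,
# because the "special_prior" tag checked above routes the dictionary back to
# ``LogNormalPositiveParam.from_dict``.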