Constraint creation changes (#93)

willGraham01 · mscroggs · web-flow · commit 1414f8e62bcf · 2025-09-03T08:26:32.000Z
* Reinstate check after renaming caused bugs in sampling

* Remove old CausalProblem class

* Add barebones classes to be populated later

* Update two normal example test to use new infrastructure

* Rework so that the lagrangian can be passed model parameters and the multiplier values as separate args

* ruffing

* Refactor out g.model argument from the Lagrangian call

* Make TODOs obvious so I don't forget to do them

* Add docstrings and more TODOs

* Todo resolution and addition

* Make _CPConstraint callable

* Hide _CPComponent attributes that we don't expect to change

* Test __call__ for _CPComponents

* Add note about __call__ in docstring

* Fix bug in how handlers are applied

* Write tests for features

* Edit Constraint so it is created in pieces

* Rework Constraint.__init__ and docstring to match new format

* Update two_normal_example integration test

* Remove todo note

* Update src/causalprog/causal_problem/causal_estimand.py

Co-authored-by: Matthew Scroggs <matthew.w.scroggs@gmail.com>

---------

Co-authored-by: Matthew Scroggs <matthew.w.scroggs@gmail.com>
diff --git a/src/causalprog/causal_problem/causal_estimand.py b/src/causalprog/causal_problem/causal_estimand.py
@@ -3,6 +3,7 @@
 from collections.abc import Callable
 from typing import Any, Concatenate, TypeAlias
 
+import jax.numpy as jnp
 import numpy.typing as npt
 
 Model: TypeAlias = Callable[..., Any]
@@ -94,13 +95,74 @@ class Constraint(_CPComponent):
     and $\epsilon$ is some tolerance.
     """
 
-    # TODO: (https://github.com/UCL/causalprog/issues/89)
-    # Should explain that Constraint needs more inputs and slightly different
-    # interpretation of the `do_with_samples` object.
-    # Inputs:
-    # - include epsilon as an input (allows constraints to have different tolerances)
-    # - `do_with_samples` should just be $g(\theta)$. Then have the instance build the
-    #   full constraint that will need to be called in the Lagrangian.
-    # - $g$ still needs to be scalar valued? Allow a wrapper function to be applied in
-    #   the event $g$ is vector-valued.
-    # If we do this, will also need to override __call__...
+    data: npt.ArrayLike
+    tolerance: npt.ArrayLike
+    _outer_norm: Callable[[npt.ArrayLike], float]
+
+    def __init__(
+        self,
+        *effect_handlers: ModelMask,
+        model_quantity: Callable[..., npt.ArrayLike],
+        outer_norm: Callable[[npt.ArrayLike], float] | None = None,
+        data: npt.ArrayLike = 0.0,
+        tolerance: float = 1.0e-6,
+    ) -> None:
+        r"""
+        Create a new constraint.
+
+        Constraints have the form
+
+        $$ c(\theta) :=
+        \mathrm{norm}\left( g(\theta)
+        - g_{\mathrm{data}} \right)
+        - \epsilon $$
+
+        where:
+        - $\mathrm{norm}$ is the outer norm of the constraint (`outer_norm`),
+        - $g(\theta)$ is the model quantity involved in the constraint
+            (`model_quantity`),
+        - $g_{\mathrm{data}}$ is the observed data (`data`),
+        - $\epsilon$ is the tolerance in the data (`tolerance`).
+
+        In a causal problem, each constraint appears as the condition $c(\theta)\leq 0$
+        in the minimisation / maximisation (hence the inclusion of the $-\epsilon$
+        term within $c(\theta)$ itself).
+
+        $g$ should be a (possibly vector-valued) function that acts on (a subset of)
+        samples from the random variables of the causal problem. It must accept
+        variable keyword-arguments only, and should access the samples for each random
+        variable by indexing via the RV names (node labels). It should return the
+        model quantity (from the samples) whose observed value is $g_{\mathrm{data}}$.
+
+        $g_{\mathrm{data}}$ should be a fixed value whose shape is broadcast-able with
+        the return shape of $g$. It defaults to $0$ if not explicitly set.
+
+        $\mathrm{norm}$ should be a suitable norm to take on the difference between the
+        model quantity as predicted by the samples ($g$) and the observed data
+        ($g_{\mathrm{data}}$). It must return a scalar value. The default is the 2-norm.
+        """
+        super().__init__(*effect_handlers, do_with_samples=model_quantity)
+
+        if outer_norm is None:
+            self._outer_norm = jnp.linalg.vector_norm
+        else:
+            self._outer_norm = outer_norm
+
+        self.data = data
+        self.tolerance = tolerance
+
+    def __call__(self, samples: dict[str, npt.ArrayLike]) -> npt.ArrayLike:
+        """
+        Evaluate the constraint, given RV samples.
+
+        Args:
+            samples: Mapping of RV (node) labels to drawn samples.
+
+        Returns:
+            Value of the constraint.
+
+        """
+        return (
+            self._outer_norm(self._do_with_samples(**samples) - self.data)
+            - self.tolerance
+        )
diff --git a/tests/test_integration/test_two_normal_example.py b/tests/test_integration/test_two_normal_example.py
@@ -78,7 +78,9 @@ def test_two_normal_example(
     # Setup the optimisation problem from the graph
     ce = CausalEstimand(do_with_samples=lambda **pv: pv["X"].mean())
     con = Constraint(
-        do_with_samples=lambda **pv: jnp.abs(pv["UX"].mean() - phi_observed) - epsilon
+        model_quantity=lambda **pv: pv["UX"].mean(),
+        data=phi_observed,
+        tolerance=epsilon,
     )
     cp = CausalProblem(
         two_normal_graph(cov=1.0),