Skip to content

Commit 904c2d9

Browse files
committed
factor out functionality for computing the gradient of a ModelFunction from ConfidenceRegionFactoryView.compute_confidence_interval(...) function, moving it to its own public instance method.
1 parent e65446f commit 904c2d9

File tree

2 files changed

+63
-55
lines changed

2 files changed

+63
-55
lines changed

pygsti/models/explicitcalc.py

Lines changed: 7 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@
1616
import warnings as _warnings
1717

1818
import numpy as _np
19+
import scipy.linalg as _la
1920

2021
from pygsti.baseobjs import basisconstructors as _bc
2122
from pygsti.tools import matrixtools as _mt
@@ -609,17 +610,13 @@ def nongauge_and_gauge_spaces(self, item_weights=None, non_gauge_mix_mx=None):
609610
else:
610611
orthog_to = gauge_space
611612

613+
u,s,_ = _la.svd(orthog_to, full_matrices=True, compute_uv=True)
614+
TOL = 1e-7
615+
r = _np.count_nonzero(s >= TOL*s[0])
616+
gauge_space = u[:, :r]
617+
nongauge_space = u[:, r:]
618+
612619
#OLD: nongauge_space = _mt.nullspace(orthog_to.T) #cols are non-gauge directions
613-
nongauge_space = _mt.nullspace_qr(orthog_to.T) # cols are non-gauge directions
614-
# print("DB: nullspace of gen_dG (shape = %s, rank=%d) = %s" \
615-
# % (str(gen_dG.shape),_np.linalg.matrix_rank(gen_dG),str(gen_ndG.shape)))
616-
617-
#REMOVE
618-
## reduce gen_dG if it doesn't have full rank
619-
#u, s, vh = _np.linalg.svd(gen_dG, full_matrices=False)
620-
#rank = _np.count_nonzero(s > P_RANK_TOL)
621-
#if rank < gen_dG.shape[1]:
622-
# gen_dG = u[:, 0:rank]
623620

624621
assert(nongauge_space.shape[0] == gauge_space.shape[0] == nongauge_space.shape[1] + gauge_space.shape[1])
625622
return nongauge_space, gauge_space

pygsti/protocols/confidenceregionfactory.py

Lines changed: 56 additions & 45 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@
1616
import warnings as _warnings
1717

1818
import numpy as _np
19+
import scipy.linalg as _la
1920
import scipy.stats as _stats
2021

2122
from pygsti import optimize as _opt
@@ -654,16 +655,21 @@ def _project_hessian(self, hessian, nongauge_space, gauge_space, gradient=None):
654655
# to transform H -> H' in another coordinate system v -> w = B @ v:
655656
# v.T @ H @ v = some 2nd deriv = v.T @ B.T @ H' @ B @ v in another basis
656657
# so H' = invB.T @ H @ invB
657-
assert(_np.allclose(hessian, hessian.T))
658+
TOL = 1e-7
659+
assert(_la.norm(hessian.imag) == 0)
660+
sym_err_abs = _la.norm(hessian - hessian.T)
661+
sym_err_rel = sym_err_abs / _la.norm(hessian)
662+
assert(sym_err_rel < TOL)
663+
hessian += hessian.T
664+
hessian /= 2
658665
invB = _np.concatenate([nongauge_space, gauge_space], axis=1) # takes (nongauge,guage) -> orig coords
659666
B = _np.linalg.inv(invB) # takes orig -> (nongauge,gauge) coords
660667
Hprime = invB.T @ hessian @ invB
661-
#assert(_np.allclose(Hprime, Hprime.T)) # doesn't handle large magnituge Hessians well
662-
assert(_np.linalg.norm(Hprime - Hprime.T) / _np.linalg.norm(Hprime) < 1e-7)
668+
assert(_la.norm(Hprime.imag) == 0)
663669

664670
if gradient is not None: # Check that Hprime is block-diagonal -- off-diag should be ~O(gradient)
665671
coupling = Hprime[0:nongauge_space.shape[1], nongauge_space.shape[1]:]
666-
if _np.linalg.norm(coupling) / (1e-6 + _np.linalg.norm(gradient)) > 5:
672+
if _np.linalg.norm(coupling) / (10*TOL + _np.linalg.norm(gradient)) > 5:
667673
_warnings.warn("Gauge-nongauge mixed partials have unusually high magnitude: \n"
668674
+ "|off-diag blk| = %.2g should be ~ |gradient| = %.2g" %
669675
(_np.linalg.norm(coupling), _np.linalg.norm(gradient)))
@@ -1013,47 +1019,7 @@ def retrieve_profile_likelihood_confidence_intervals(self, label=None, component
10131019
raise ValueError(("Invalid item label (%s) for computing" % label)
10141020
+ "profile likelihood confidence intervals")
10151021

1016-
def compute_confidence_interval(self, fn_obj, eps=1e-7,
1017-
return_fn_val=False, verbosity=0):
1018-
"""
1019-
Compute the confidence interval for an arbitrary function.
1020-
1021-
This "function", however, must be encapsulated as a
1022-
`ModelFunction` object, which allows it to neatly specify
1023-
what its dependencies are and allows it to compaute finite-
1024-
different derivatives more efficiently.
1025-
1026-
Parameters
1027-
----------
1028-
fn_obj : ModelFunction
1029-
An object representing the function to evaluate. The
1030-
returned confidence interval is based on linearizing this function
1031-
and propagating the model-space confidence region.
1032-
1033-
eps : float, optional
1034-
Step size used when taking finite-difference derivatives of fnOfOp.
1035-
1036-
return_fn_val : bool, optional
1037-
If True, return the value of fnOfOp along with it's confidence
1038-
region half-widths.
1039-
1040-
verbosity : int, optional
1041-
Specifies level of detail in standard output.
1042-
1043-
Returns
1044-
-------
1045-
df : float or numpy array
1046-
Half-widths of confidence intervals for each of the elements
1047-
in the float or array returned by fnOfOp. Thus, shape of
1048-
df matches that returned by fnOfOp.
1049-
f0 : float or numpy array
1050-
Only returned when return_fn_val == True. Value of fnOfOp
1051-
at the gate specified by op_label.
1052-
"""
1053-
1054-
nParams = self.model.num_params
1055-
f0 = fn_obj.evaluate(self.model) # function value at "base point"
1056-
1022+
def compute_grad_f(self, fn_obj, f0, nParams, eps=1e-7):
10571023
#Get finite difference derivative gradF that is shape (nParams, <shape of f0>)
10581024
gradF = _create_empty_grad_f(f0, nParams)
10591025

@@ -1105,6 +1071,51 @@ def compute_confidence_interval(self, fn_obj, eps=1e-7,
11051071
assert(_np.linalg.norm(_np.imag(f - f0)) < 1e-12 or _np.iscomplexobj(gradF)
11061072
), "gradF seems to be the wrong type!"
11071073
gradF[igp] = _np.real_if_close(f - f0) / eps
1074+
return gradF
1075+
1076+
def compute_confidence_interval(self, fn_obj, eps=1e-7,
1077+
return_fn_val=False, verbosity=0):
1078+
"""
1079+
Compute the confidence interval for an arbitrary function.
1080+
1081+
This "function", however, must be encapsulated as a
1082+
`ModelFunction` object, which allows it to neatly specify
1083+
what its dependencies are and allows it to compute finite-
1084+
difference derivatives more efficiently.
1085+
1086+
Parameters
1087+
----------
1088+
fn_obj : ModelFunction
1089+
An object representing the function to evaluate. The
1090+
returned confidence interval is based on linearizing this function
1091+
and propagating the model-space confidence region.
1092+
1093+
eps : float, optional
1094+
Step size used when taking finite-difference derivatives of fnOfOp.
1095+
1096+
return_fn_val : bool, optional
1097+
If True, return the value of fnOfOp along with its confidence
1098+
region half-widths.
1099+
1100+
verbosity : int, optional
1101+
Specifies level of detail in standard output.
1102+
1103+
Returns
1104+
-------
1105+
df : float or numpy array
1106+
Half-widths of confidence intervals for each of the elements
1107+
in the float or array returned by fnOfOp. Thus, shape of
1108+
df matches that returned by fnOfOp.
1109+
f0 : float or numpy array
1110+
Only returned when return_fn_val == True. Value of fnOfOp
1111+
at the gate specified by op_label.
1112+
"""
1113+
1114+
nParams = self.model.num_params
1115+
f0 = fn_obj.evaluate(self.model) # function value at "base point"
1116+
1117+
#Get finite difference derivative gradF that is shape (nParams, <shape of f0>)
1118+
gradF = self.compute_grad_f(fn_obj, f0, nParams, eps)
11081119

11091120
return self._compute_return_from_grad_f(gradF, f0, return_fn_val, verbosity)
11101121

0 commit comments

Comments
 (0)