From 35062fb93c812e1b2319a7878d1992d2453d95ac Mon Sep 17 00:00:00 2001
From: davidwalter2 <david.walter@cern.ch>
Date: Thu, 1 Jan 2026 14:14:02 -0500
Subject: [PATCH 1/5] Premature work on BB full with gamma

---
 rabbit/fitter.py | 104 ++++++++++++++++++++++++++++++++++++-----------
 1 file changed, 80 insertions(+), 24 deletions(-)

diff --git a/rabbit/fitter.py b/rabbit/fitter.py
index 2233cc6..e8a367f 100644
--- a/rabbit/fitter.py
+++ b/rabbit/fitter.py
@@ -67,14 +67,14 @@ def __init__(
         else:
             self.binByBinStatType = options.binByBinStatType
 
-        if (
-            self.binByBinStat
-            and self.binByBinStatMode == "full"
-            and not self.binByBinStatType.startswith("normal")
-        ):
-            raise Exception(
-                'bin-by-bin stat only for option "--binByBinStatMode full" with "--binByBinStatType normal"'
-            )
+        # if (
+        #     self.binByBinStat
+        #     and self.binByBinStatMode == "full"
+        #     and not self.binByBinStatType.startswith("normal")
+        # ):
+        #     raise Exception(
+        #         'bin-by-bin stat only for option "--binByBinStatMode full" with "--binByBinStatType normal"'
+        #     )
 
         if (
             options.covarianceFit
@@ -1390,15 +1390,36 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
 
                 if self.chisqFit:
                     if self.binByBinStatType == "gamma":
+
                         kstat = self.kstat[: self.indata.nbins]
+                        if self.binByBinStatMode == "lite":
+                            abeta = nexp_profile**2
+                            bbeta = kstat * self.varnobs - nexp_profile * self.nobs
+                            cbeta = -kstat * self.varnobs * beta0
+                            beta = solve_quad_eq(abeta, bbeta, cbeta)
 
-                        abeta = nexp_profile**2
-                        bbeta = kstat * self.varnobs - nexp_profile * self.nobs
-                        cbeta = -kstat * self.varnobs * beta0
-                        beta = solve_quad_eq(abeta, bbeta, cbeta)
+                            betamask = self.betamask[: self.indata.nbins]
+                            beta = tf.where(betamask, beta0, beta)
+
+                        elif self.binByBinStatMode == "full":
+                            # compute sum of processes from Gaussian approximation
+                            norm_profile = norm[: self.indata.nbins]
+                            n2kstat = tf.square(norm_profile) / kstat
+                            n2kstat = tf.where(
+                                betamask,
+                                tf.constant(0.0, dtype=self.indata.dtype),
+                                n2kstat,
+                            )
+                            n2kstatsum = tf.reduce_sum(n2kstat, axis=-1)
+
+                            nbeta = (
+                                self.nobs / self.varnobs * n2kstatsum
+                                + tf.reduce_sum(norm_profile * beta0, axis=-1)
+                            ) / (1 + 1 / self.varnobs * n2kstatsum)
+
+                            # individual beta parameter from Gamma distribution
+                            # TODO
 
-                        betamask = self.betamask[: self.indata.nbins]
-                        beta = tf.where(betamask, beta0, beta)
                     elif self.binByBinStatType == "normal-multiplicative":
                         kstat = self.kstat[: self.indata.nbins]
                         betamask = self.betamask[: self.indata.nbins]
@@ -1406,9 +1427,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                             beta = (
                                 nexp_profile * self.nobs / self.varnobs + kstat * beta0
                             ) / (kstat + nexp_profile * nexp_profile / self.varnobs)
-
-                            beta = tf.where(betamask, beta0, beta)
-
                         elif self.binByBinStatMode == "full":
                             norm_profile = norm[: self.indata.nbins]
                             n2kstat = tf.square(norm_profile) / kstat
@@ -1429,7 +1447,7 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                                 * norm_profile
                                 / kstat
                             )
-                            beta = tf.where(betamask, beta0, beta)
+                        beta = tf.where(betamask, beta0, beta)
                     elif self.binByBinStatType == "normal-additive":
                         varbeta = self.varbeta[: self.indata.nbins]
                         sbeta = tf.math.sqrt(varbeta)
@@ -1475,7 +1493,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                             beta = tf.linalg.solve(A, b)
 
                             beta = tf.squeeze(beta, axis=-1)
-                            beta = tf.where(betamask, beta0, beta)
                         elif self.binByBinStatMode == "full":
                             norm_profile = norm[: self.indata.nbins]
 
@@ -1509,7 +1526,7 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                             beta = beta0 - norm_profile / kstat * (
                                 self.data_cov_inv @ (nbeta - self.nobs[:, None])
                             )
-                            beta = tf.where(betamask, beta0, beta)
+                        beta = tf.where(betamask, beta0, beta)
                     elif self.binByBinStatType == "normal-additive":
                         varbeta = self.varbeta[: self.indata.nbins]
                         sbeta = tf.math.sqrt(varbeta)
@@ -1546,8 +1563,34 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                         kstat = self.kstat[: self.indata.nbins]
                         betamask = self.betamask[: self.indata.nbins]
 
-                        beta = (self.nobs + kstat * beta0) / (nexp_profile + kstat)
+                        if self.binByBinStatMode == "lite":
+                            beta = (self.nobs + kstat * beta0) / (nexp_profile + kstat)
+                        elif self.binByBinStatMode == "full":
+                            # compute sum of processes from Gaussian approximation
+                            norm_profile = norm[: self.indata.nbins]
+                            n2kstat = tf.square(norm_profile) / kstat
+                            n2kstat = tf.where(
+                                betamask,
+                                tf.constant(0.0, dtype=self.indata.dtype),
+                                n2kstat,
+                            )
+                            pbeta = tf.reduce_sum(
+                                n2kstat - beta0 * norm_profile, axis=-1
+                            )
+                            qbeta = -self.nobs * tf.reduce_sum(n2kstat, axis=-1)
+                            nbeta = solve_quad_eq(1, pbeta, qbeta)
+                            # individual beta parameter from Gamma distribution
+                            beta = (
+                                kstat
+                                * beta0
+                                / (
+                                    norm_profile
+                                    - (self.nobs / nbeta)[..., None] * norm_profile
+                                    + kstat
+                                )
+                            )
                         beta = tf.where(betamask, beta0, beta)
+
                     elif self.binByBinStatType == "normal-multiplicative":
                         kstat = self.kstat[: self.indata.nbins]
                         betamask = self.betamask[: self.indata.nbins]
@@ -1556,7 +1599,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                             bbeta = nexp_profile - beta0 * kstat
                             cbeta = -self.nobs
                             beta = solve_quad_eq(abeta, bbeta, cbeta)
-                            beta = tf.where(betamask, beta0, beta)
                         elif self.binByBinStatMode == "full":
                             norm_profile = norm[: self.indata.nbins]
                             n2kstat = tf.square(norm_profile) / kstat
@@ -1576,7 +1618,7 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                                 * norm_profile
                                 / kstat
                             )
-                            beta = tf.where(betamask, beta0, beta)
+                        beta = tf.where(betamask, beta0, beta)
                     elif self.binByBinStatType == "normal-additive":
                         varbeta = self.varbeta[: self.indata.nbins]
                         sbeta = tf.math.sqrt(varbeta)
@@ -1965,6 +2007,10 @@ def _compute_nll_components(self, profile=True, full_nll=False):
 
         lc = self._compute_lc(full_nll)
 
+        import pdb
+
+        pdb.set_trace()
+
         lbeta = self._compute_lbeta(beta, full_nll)
 
         return ln, lc, lbeta, beta
@@ -1975,9 +2021,19 @@ def _compute_nll(self, profile=True, full_nll=False):
         )
         l = ln + lc
 
-        if lbeta is not None:
+        if self.binByBinStat:
             l = l + lbeta
 
+        logger.debug(f"{ln=}; {lc=}; {lbeta=}")
+
+        logger.debug(f"{beta=}")
+
+        betamin = tf.reduce_min(beta)
+        betamax = tf.reduce_max(beta)
+
+        logger.debug(f"{betamin=}")
+        logger.debug(f"{betamax=}")
+
         return l
 
     def _compute_loss(self, profile=True):

From 802478c327dfaa887dc2fe5796a55b7e711169dd Mon Sep 17 00:00:00 2001
From: davidwalter2 <david.walter@cern.ch>
Date: Thu, 1 Jan 2026 15:12:06 -0500
Subject: [PATCH 2/5] First attempt for bin by bin full with gamma

---
 rabbit/fitter.py | 145 +++++++++++++++++++++++++++++++----------------
 1 file changed, 97 insertions(+), 48 deletions(-)

diff --git a/rabbit/fitter.py b/rabbit/fitter.py
index e8a367f..8da7e7d 100644
--- a/rabbit/fitter.py
+++ b/rabbit/fitter.py
@@ -67,15 +67,6 @@ def __init__(
         else:
             self.binByBinStatType = options.binByBinStatType
 
-        # if (
-        #     self.binByBinStat
-        #     and self.binByBinStatMode == "full"
-        #     and not self.binByBinStatType.startswith("normal")
-        # ):
-        #     raise Exception(
-        #         'bin-by-bin stat only for option "--binByBinStatMode full" with "--binByBinStatType normal"'
-        #     )
-
         if (
             options.covarianceFit
             and self.binByBinStat
@@ -125,15 +116,32 @@ def __init__(
             )
             self.init_blinding_values(options.unblind)
 
-        self.parms = np.concatenate([self.poi_model.pois, self.indata.systs])
-
+        parms = [self.poi_model.pois, self.indata.systs]
         # tf variable containing all fit parameters
         thetadefault = tf.zeros([self.indata.nsyst], dtype=self.indata.dtype)
         if self.poi_model.npoi > 0:
-            xdefault = tf.concat([self.poi_model.xpoidefault, thetadefault], axis=0)
+            xdefault = [self.poi_model.xpoidefault, thetadefault]
         else:
-            xdefault = thetadefault
+            xdefault = [thetadefault]
+        if self.binByBinStatType == "gamma" and self.binByBinStatMode == "full":
+            # explicit parameters for nbeta define as: nbeta = sum(beta_j n_j)/ sum(n_j)
+            nbetadefault = tf.ones([self.indata.nbins], dtype=self.indata.dtype)
+            xdefault.append(nbetadefault)
+            self.nbeta0 = tf.Variable(
+                tf.ones(self.indata.nbins, dtype=self.indata.dtype),
+                trainable=False,
+                name="nbeta0",
+            )
+            parms_nbeta = np.char.add(
+                "nbeta_", np.arange(self.indata.nbins).astype(str)
+            )
+            parms.append(parms_nbeta)
 
+        self.parms = np.concatenate(parms)
+        if len(xdefault) > 1:
+            xdefault = tf.concat(xdefault, axis=0)
+        else:
+            xdefault = xdefault[0]
         self.x = tf.Variable(xdefault, trainable=True, name="x")
 
         # for freezing parameters
@@ -389,8 +397,17 @@ def set_blinding_offsets(self, blind=True):
                 np.zeros(self.indata.nsyst, dtype=np.float64)
             )
 
+    def get_nbeta(self):
+        nbeta = self.x[
+            self.poi_model.npoi
+            + self.indata.nsyst : self.poi_model.npoi
+            + self.indata.nsyst
+            + self.indata.nbins
+        ]
+        return nbeta
+
     def get_blinded_theta(self):
-        theta = self.x[self.poi_model.npoi :]
+        theta = self.x[self.poi_model.npoi : self.poi_model.npoi + self.indata.nsyst]
         if self.do_blinding:
             return theta + self._blinding_offsets_theta
         else:
@@ -424,8 +441,14 @@ def prefit_covariance(self, unconstrained_err=0.0):
             unconstrained_err**2,
             tf.math.reciprocal(self.indata.constraintweights),
         )
+        vars = [var_poi, var_theta]
+
+        if self.binByBinStatType == "gamma" and self.binByBinStatMode == "full":
+            # uncertainty from explicit nbeta parameters are accounted for by implicit beta parameters
+            var_nbeta = tf.zeros([self.indata.nbins], dtype=self.indata.dtype)
+            vars.append(var_nbeta)
 
-        invhessianprefit = tf.linalg.diag(tf.concat([var_poi, var_theta], axis=0))
+        invhessianprefit = tf.linalg.diag(tf.concat(vars, axis=0))
         return invhessianprefit
 
     @tf.function
@@ -465,9 +488,19 @@ def theta0defaultassign(self):
 
     def xdefaultassign(self):
         if self.poi_model.npoi == 0:
-            self.x.assign(self.theta0)
+            to_assign = [self.theta0]
+        else:
+            to_assign = [self.poi_model.xpoidefault, self.theta0]
+
+        if self.binByBinStatType == "gamma" and self.binByBinStatMode == "full":
+            to_assign.append(self.nbeta0)
+
+        if len(to_assign) > 1:
+            to_assign = tf.concat(to_assign, axis=0)
         else:
-            self.x.assign(tf.concat([self.poi_model.xpoidefault, self.theta0], axis=0))
+            to_assign = to_assign[0]
+
+        self.x.assign(to_assign)
 
     def beta0defaultassign(self):
         self.set_beta0(self._default_beta0())
@@ -512,6 +545,10 @@ def bayesassign(self):
 
         if self.binByBinStat:
             if self.binByBinStatType == "gamma":
+                if self.binByBinStatMode == "full":
+                    raise NotImplementedError(
+                        "Barlow-Beeston full with gamma is not yet implemented"
+                    )
                 # FIXME this is only valid for beta0=beta=1 (but this should always be the case when throwing toys)
                 betagen = (
                     tf.random.gamma(
@@ -547,6 +584,10 @@ def frequentistassign(self):
         )
         if self.binByBinStat:
             if self.binByBinStatType == "gamma":
+                if self.binByBinStatMode == "full":
+                    raise NotImplementedError(
+                        "Barlow-Beeston full with gamma is not yet implemented"
+                    )
                 # FIXME this is only valid for beta0=beta=1 (but this should always be the case when throwing toys)
                 beta0gen = (
                     tf.random.poisson(
@@ -1291,7 +1332,9 @@ def _compute_yields_noBBB(self, full=True):
             self.frozen_params_mask[: self.poi_model.npoi], tf.stop_gradient(poi), poi
         )
         theta = tf.where(
-            self.frozen_params_mask[self.poi_model.npoi :],
+            self.frozen_params_mask[
+                self.poi_model.npoi : self.poi_model.npoi + self.indata.nsyst
+            ],
             tf.stop_gradient(theta),
             theta,
         )
@@ -1402,20 +1445,26 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                             beta = tf.where(betamask, beta0, beta)
 
                         elif self.binByBinStatMode == "full":
-                            # compute sum of processes from Gaussian approximation
-                            norm_profile = norm[: self.indata.nbins]
-                            n2kstat = tf.square(norm_profile) / kstat
-                            n2kstat = tf.where(
-                                betamask,
-                                tf.constant(0.0, dtype=self.indata.dtype),
-                                n2kstat,
+                            # # compute sum of processes from Gaussian approximation
+                            # norm_profile = norm[: self.indata.nbins]
+                            # n2kstat = tf.square(norm_profile) / kstat
+                            # n2kstat = tf.where(
+                            #     betamask,
+                            #     tf.constant(0.0, dtype=self.indata.dtype),
+                            #     n2kstat,
+                            # )
+                            # n2kstatsum = tf.reduce_sum(n2kstat, axis=-1)
+
+                            # nbeta = (
+                            #     self.nobs / self.varnobs * n2kstatsum
+                            #     + tf.reduce_sum(norm_profile * beta0, axis=-1)
+                            # ) / (1 + 1 / self.varnobs * n2kstatsum)
+
+                            raise NotImplementedError(
+                                "Barlow-Beeston full with gamma not yet implemented in chisqFit"
                             )
-                            n2kstatsum = tf.reduce_sum(n2kstat, axis=-1)
 
-                            nbeta = (
-                                self.nobs / self.varnobs * n2kstatsum
-                                + tf.reduce_sum(norm_profile * beta0, axis=-1)
-                            ) / (1 + 1 / self.varnobs * n2kstatsum)
+                            nbeta = self.x[self.poi_model.npoi + self.indata.nsyst :]
 
                             # individual beta parameter from Gamma distribution
                             # TODO
@@ -1566,26 +1615,31 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                         if self.binByBinStatMode == "lite":
                             beta = (self.nobs + kstat * beta0) / (nexp_profile + kstat)
                         elif self.binByBinStatMode == "full":
-                            # compute sum of processes from Gaussian approximation
                             norm_profile = norm[: self.indata.nbins]
-                            n2kstat = tf.square(norm_profile) / kstat
-                            n2kstat = tf.where(
-                                betamask,
-                                tf.constant(0.0, dtype=self.indata.dtype),
-                                n2kstat,
-                            )
-                            pbeta = tf.reduce_sum(
-                                n2kstat - beta0 * norm_profile, axis=-1
-                            )
-                            qbeta = -self.nobs * tf.reduce_sum(n2kstat, axis=-1)
-                            nbeta = solve_quad_eq(1, pbeta, qbeta)
+
+                            # # compute sum of processes from Gaussian approximation
+                            # n2kstat = tf.square(norm_profile) / kstat
+                            # n2kstat = tf.where(
+                            #     betamask,
+                            #     tf.constant(0.0, dtype=self.indata.dtype),
+                            #     n2kstat,
+                            # )
+                            # pbeta = tf.reduce_sum(
+                            #     n2kstat - beta0 * norm_profile, axis=-1
+                            # )
+                            # qbeta = -self.nobs * tf.reduce_sum(n2kstat, axis=-1)
+                            # nbeta = solve_quad_eq(1, pbeta, qbeta)
+
+                            nbeta = self.x[self.poi_model.npoi + self.indata.nsyst :]
+
                             # individual beta parameter from Gamma distribution
                             beta = (
                                 kstat
                                 * beta0
                                 / (
                                     norm_profile
-                                    - (self.nobs / nbeta)[..., None] * norm_profile
+                                    - (self.nobs / (nexp_profile * nbeta))[..., None]
+                                    * norm_profile
                                     + kstat
                                 )
                             )
@@ -2006,11 +2060,6 @@ def _compute_nll_components(self, profile=True, full_nll=False):
                 )
 
         lc = self._compute_lc(full_nll)
-
-        import pdb
-
-        pdb.set_trace()
-
         lbeta = self._compute_lbeta(beta, full_nll)
 
         return ln, lc, lbeta, beta

From d94dc0cfc9212ff2dc113ccfd94b0aaee51ab492 Mon Sep 17 00:00:00 2001
From: davidwalter2 <david.walter@cern.ch>
Date: Thu, 1 Jan 2026 16:45:40 -0500
Subject: [PATCH 3/5] Fix edmval for bb full

---
 rabbit/fitter.py | 91 +++++++++++++++++-------------------------------
 1 file changed, 32 insertions(+), 59 deletions(-)

diff --git a/rabbit/fitter.py b/rabbit/fitter.py
index 5a5c5d3..8b5c195 100644
--- a/rabbit/fitter.py
+++ b/rabbit/fitter.py
@@ -238,10 +238,10 @@ def __init__(
                     self.varbeta = self.indata.sumw2
                     self.sumw = self.indata.sumw
 
+            self.betamask = (self.varbeta == 0.0) | (self.sumw == 0.0)
+
             if self.binByBinStatType in ["gamma", "normal-multiplicative"]:
-                self.kstat = self.sumw**2 / self.varbeta
-                self.betamask = (self.varbeta == 0.0) | (self.kstat == 0.0)
-                self.kstat = tf.where(self.betamask, 1.0, self.kstat)
+                self.kstat = tf.where(self.betamask, 1.0, self.sumw**2 / self.varbeta)
             elif self.binByBinStatType == "normal-additive":
                 # precompute decomposition of composite matrix to speed up
                 # calculation of profiled beta values
@@ -808,7 +808,12 @@ def envelope(values):
 
     def _compute_impact_group(self, v, idxs):
         cov_reduced = tf.gather(
-            self.cov[self.poi_model.npoi :, self.poi_model.npoi :], idxs, axis=0
+            self.cov[
+                self.poi_model.npoi : self.poi_model.npoi + self.indata.nsyst,
+                self.poi_model.npoi : self.poi_model.npoi + self.indata.nsyst,
+            ],
+            idxs,
+            axis=0,
         )
         cov_reduced = tf.gather(cov_reduced, idxs, axis=1)
         v_reduced = tf.gather(v, idxs, axis=1)
@@ -820,7 +825,10 @@ def _gather_poi_noi_vector(self, v):
         v_poi = v[: self.poi_model.npoi]
         # protection for constained NOIs, set them to 0
         mask = (self.indata.noiidxs >= 0) & (
-            self.indata.noiidxs < tf.shape(v[self.poi_model.npoi :])[0]
+            self.indata.noiidxs
+            < tf.shape(
+                v[self.poi_model.npoi : self.poi_model.npoi + self.indata.nsyst]
+            )[0]
         )
         safe_idxs = tf.where(mask, self.indata.noiidxs, 0)
         mask = tf.cast(mask, v.dtype)
@@ -830,7 +838,13 @@ def _gather_poi_noi_vector(self, v):
                 [tf.shape(mask), tf.ones(tf.rank(v) - 1, dtype=tf.int32)], axis=0
             ),
         )
-        v_noi = tf.gather(v[self.poi_model.npoi :], safe_idxs) * mask
+        v_noi = (
+            tf.gather(
+                v[self.poi_model.npoi : self.poi_model.npoi + self.indata.nsyst],
+                safe_idxs,
+            )
+            * mask
+        )
         v_gathered = tf.concat([v_poi, v_noi], axis=0)
         return v_gathered
 
@@ -870,7 +884,8 @@ def impacts_parms(self, hess):
         if len(self.indata.systgroupidxs):
             impacts_grouped_syst = tf.map_fn(
                 lambda idxs: self._compute_impact_group(
-                    v[:, self.poi_model.npoi :], idxs
+                    v[:, self.poi_model.npoi : self.poi_model.npoi + self.indata.nsyst],
+                    idxs,
                 ),
                 tf.ragged.constant(self.indata.systgroupidxs, dtype=tf.int32),
                 fn_output_signature=tf.TensorSpec(
@@ -1444,6 +1459,7 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
 
                 nexp_profile = nexp[: self.indata.nbins]
                 beta0 = self.beta0[: self.indata.nbins]
+                betamask = self.betamask[: self.indata.nbins]
 
                 if self.chisqFit:
                     if self.binByBinStatType == "gamma":
@@ -1454,26 +1470,7 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                             bbeta = kstat * self.varnobs - nexp_profile * self.nobs
                             cbeta = -kstat * self.varnobs * beta0
                             beta = solve_quad_eq(abeta, bbeta, cbeta)
-
-                            betamask = self.betamask[: self.indata.nbins]
-                            beta = tf.where(betamask, beta0, beta)
-
                         elif self.binByBinStatMode == "full":
-                            # # compute sum of processes from Gaussian approximation
-                            # norm_profile = norm[: self.indata.nbins]
-                            # n2kstat = tf.square(norm_profile) / kstat
-                            # n2kstat = tf.where(
-                            #     betamask,
-                            #     tf.constant(0.0, dtype=self.indata.dtype),
-                            #     n2kstat,
-                            # )
-                            # n2kstatsum = tf.reduce_sum(n2kstat, axis=-1)
-
-                            # nbeta = (
-                            #     self.nobs / self.varnobs * n2kstatsum
-                            #     + tf.reduce_sum(norm_profile * beta0, axis=-1)
-                            # ) / (1 + 1 / self.varnobs * n2kstatsum)
-
                             raise NotImplementedError(
                                 "Barlow-Beeston full with gamma not yet implemented in chisqFit"
                             )
@@ -1485,7 +1482,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
 
                     elif self.binByBinStatType == "normal-multiplicative":
                         kstat = self.kstat[: self.indata.nbins]
-                        betamask = self.betamask[: self.indata.nbins]
                         if self.binByBinStatMode == "lite":
                             beta = (
                                 nexp_profile * self.nobs / self.varnobs + kstat * beta0
@@ -1510,7 +1506,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                                 * norm_profile
                                 / kstat
                             )
-                        beta = tf.where(betamask, beta0, beta)
                     elif self.binByBinStatType == "normal-additive":
                         varbeta = self.varbeta[: self.indata.nbins]
                         sbeta = tf.math.sqrt(varbeta)
@@ -1535,7 +1530,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                 elif self.covarianceFit:
                     if self.binByBinStatType == "normal-multiplicative":
                         kstat = self.kstat[: self.indata.nbins]
-                        betamask = self.betamask[: self.indata.nbins]
                         if self.binByBinStatMode == "lite":
 
                             nexp_profile_m = tf.linalg.LinearOperatorDiag(nexp_profile)
@@ -1589,7 +1583,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                             beta = beta0 - norm_profile / kstat * (
                                 self.data_cov_inv @ (nbeta - self.nobs[:, None])
                             )
-                        beta = tf.where(betamask, beta0, beta)
                     elif self.binByBinStatType == "normal-additive":
                         varbeta = self.varbeta[: self.indata.nbins]
                         sbeta = tf.math.sqrt(varbeta)
@@ -1624,26 +1617,10 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                 else:
                     if self.binByBinStatType == "gamma":
                         kstat = self.kstat[: self.indata.nbins]
-                        betamask = self.betamask[: self.indata.nbins]
-
                         if self.binByBinStatMode == "lite":
                             beta = (self.nobs + kstat * beta0) / (nexp_profile + kstat)
                         elif self.binByBinStatMode == "full":
                             norm_profile = norm[: self.indata.nbins]
-
-                            # # compute sum of processes from Gaussian approximation
-                            # n2kstat = tf.square(norm_profile) / kstat
-                            # n2kstat = tf.where(
-                            #     betamask,
-                            #     tf.constant(0.0, dtype=self.indata.dtype),
-                            #     n2kstat,
-                            # )
-                            # pbeta = tf.reduce_sum(
-                            #     n2kstat - beta0 * norm_profile, axis=-1
-                            # )
-                            # qbeta = -self.nobs * tf.reduce_sum(n2kstat, axis=-1)
-                            # nbeta = solve_quad_eq(1, pbeta, qbeta)
-
                             nbeta = self.x[self.poi_model.npoi + self.indata.nsyst :]
 
                             # individual beta parameter from Gamma distribution
@@ -1657,11 +1634,9 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                                     + kstat
                                 )
                             )
-                        beta = tf.where(betamask, beta0, beta)
 
                     elif self.binByBinStatType == "normal-multiplicative":
                         kstat = self.kstat[: self.indata.nbins]
-                        betamask = self.betamask[: self.indata.nbins]
                         if self.binByBinStatMode == "lite":
                             abeta = kstat
                             bbeta = nexp_profile - beta0 * kstat
@@ -1686,7 +1661,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                                 * norm_profile
                                 / kstat
                             )
-                        beta = tf.where(betamask, beta0, beta)
                     elif self.binByBinStatType == "normal-additive":
                         varbeta = self.varbeta[: self.indata.nbins]
                         sbeta = tf.math.sqrt(varbeta)
@@ -1715,6 +1689,7 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
 
                             beta = beta0 + (self.nobs / nbeta - 1)[..., None] * sbeta
 
+                beta = tf.where(betamask, beta0, beta)
                 if self.indata.nbinsmasked:
                     beta = tf.concat([beta, self.beta0[self.indata.nbins :]], axis=0)
             else:
@@ -2087,16 +2062,6 @@ def _compute_nll(self, profile=True, full_nll=False):
         if self.binByBinStat:
             l = l + lbeta
 
-        logger.debug(f"{ln=}; {lc=}; {lbeta=}")
-
-        logger.debug(f"{beta=}")
-
-        betamin = tf.reduce_min(beta)
-        betamax = tf.reduce_max(beta)
-
-        logger.debug(f"{betamin=}")
-        logger.debug(f"{betamax=}")
-
         return l
 
     def _compute_loss(self, profile=True):
@@ -2168,6 +2133,14 @@ def loss_val_grad_hess_beta(self, profile=True):
             grad = t1.gradient(val, self.ubeta)
         hess = t2.jacobian(grad, self.ubeta)
 
+        grad = tf.reshape(grad, [-1])
+        hess = tf.reshape(hess, [grad.shape[0], grad.shape[0]])
+
+        betamask = ~tf.reshape(self.betamask, [-1])
+        grad = grad[betamask]
+        hess = tf.boolean_mask(hess, betamask, axis=0)
+        hess = tf.boolean_mask(hess, betamask, axis=1)
+
         return val, grad, hess
 
     def minimize(self):

From b7d9ec8078cf4eb9eadd29aa08e859138484e5a9 Mon Sep 17 00:00:00 2001
From: davidwalter2 <david.walter@cern.ch>
Date: Sun, 4 Jan 2026 10:47:28 -0500
Subject: [PATCH 4/5] Implement BB full with gamma for chisq fit; Implement
 impacts for BB full with gamma

---
 rabbit/fitter.py | 59 ++++++++++++++++++++++++++++++++++--------------
 1 file changed, 42 insertions(+), 17 deletions(-)

diff --git a/rabbit/fitter.py b/rabbit/fitter.py
index 8b5c195..a6a9605 100644
--- a/rabbit/fitter.py
+++ b/rabbit/fitter.py
@@ -851,12 +851,33 @@ def _gather_poi_noi_vector(self, v):
     @tf.function
     def impacts_parms(self, hess):
         # impact for poi at index i in covariance matrix from nuisance with index j is C_ij/sqrt(C_jj) = <deltax deltatheta>/sqrt(<deltatheta^2>)
-        v = self._gather_poi_noi_vector(self.cov)
-        impacts = v / tf.reshape(tf.sqrt(tf.linalg.diag_part(self.cov)), [1, -1])
-
         nstat = self.poi_model.npoi + self.indata.nsystnoconstraint
-        hess_stat = hess[:nstat, :nstat]
-        inv_hess_stat = tf.linalg.inv(hess_stat)
+
+        if self.binByBinStatMode == "full" and self.binByBinStatType == "gamma":
+            # strip off explicit BB parameters
+            cov = self.cov[
+                : self.poi_model.npoi + self.indata.nsyst,
+                : self.poi_model.npoi + self.indata.nsyst,
+            ]
+            # explicit BB parameters are unconstrained, i.e. stat uncertainty
+            idx_stat = tf.concat(
+                [
+                    tf.range(nstat),
+                    tf.range(
+                        self.poi_model.npoi + self.indata.nsyst,
+                        self.poi_model.npoi + self.indata.nsyst + self.indata.nbins,
+                    ),
+                ],
+                axis=0,
+            )
+            hess_stat = tf.gather(tf.gather(hess, idx_stat, axis=0), idx_stat, axis=1)
+        else:
+            cov = self.cov
+            hess_stat = hess[:nstat, :nstat]
+
+        v = self._gather_poi_noi_vector(cov)
+        impacts = v / tf.reshape(tf.sqrt(tf.linalg.diag_part(cov)), [1, -1])
+        inv_hess_stat = tf.linalg.inv(hess_stat)[:nstat, :nstat]
 
         if self.binByBinStat:
             # impact bin-by-bin stat
@@ -1071,6 +1092,8 @@ def global_impacts_parms(self):
             impacts_grouped_syst = tf.transpose(impacts_grouped_syst)
             impacts_grouped = tf.concat([impacts_grouped_syst, impacts_grouped], axis=1)
 
+        # strip off explicit BB parameters if available
+        impacts = impacts[:, : self.indata.nsyst]
         return impacts, impacts_grouped
 
     def _pd2ldbeta2(self, profile=False):
@@ -1302,6 +1325,8 @@ def compute_derivatives(dvars):
                     [impacts_grouped_syst, impacts_grouped], axis=-1
                 )
 
+            # strip off explicit BB parameters if available
+            impacts = impacts[:, : self.indata.nsyst]
             impacts = tf.reshape(impacts, [*expvar.shape, impacts.shape[-1]])
             impacts_grouped = tf.reshape(
                 impacts_grouped, [*expvar.shape, impacts_grouped.shape[-1]]
@@ -1463,7 +1488,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
 
                 if self.chisqFit:
                     if self.binByBinStatType == "gamma":
-
                         kstat = self.kstat[: self.indata.nbins]
                         if self.binByBinStatMode == "lite":
                             abeta = nexp_profile**2
@@ -1471,15 +1495,19 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                             cbeta = -kstat * self.varnobs * beta0
                             beta = solve_quad_eq(abeta, bbeta, cbeta)
                         elif self.binByBinStatMode == "full":
-                            raise NotImplementedError(
-                                "Barlow-Beeston full with gamma not yet implemented in chisqFit"
-                            )
-
+                            norm_profile = norm[: self.indata.nbins]
                             nbeta = self.x[self.poi_model.npoi + self.indata.nsyst :]
-
-                            # individual beta parameter from Gamma distribution
-                            # TODO
-
+                            beta = (
+                                kstat
+                                * beta0
+                                / (
+                                    ((self.nobs - nexp_profile * nbeta) / self.varnobs)[
+                                        ..., None
+                                    ]
+                                    * norm_profile
+                                    + kstat
+                                )
+                            )
                     elif self.binByBinStatType == "normal-multiplicative":
                         kstat = self.kstat[: self.indata.nbins]
                         if self.binByBinStatMode == "lite":
@@ -1622,8 +1650,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                         elif self.binByBinStatMode == "full":
                             norm_profile = norm[: self.indata.nbins]
                             nbeta = self.x[self.poi_model.npoi + self.indata.nsyst :]
-
-                            # individual beta parameter from Gamma distribution
                             beta = (
                                 kstat
                                 * beta0
@@ -1634,7 +1660,6 @@ def _compute_yields_with_beta(self, profile=True, compute_norm=False, full=True)
                                     + kstat
                                 )
                             )
-
                     elif self.binByBinStatType == "normal-multiplicative":
                         kstat = self.kstat[: self.indata.nbins]
                         if self.binByBinStatMode == "lite":

From 72842e716f73dc9e4a5d5859e25d4019a8e18715 Mon Sep 17 00:00:00 2001
From: davidwalter2 <david.walter@cern.ch>
Date: Sun, 4 Jan 2026 11:18:30 -0500
Subject: [PATCH 5/5] Return None callback in case of analytic solution

---
 bin/rabbit_fit.py | 3 ++-
 rabbit/fitter.py  | 2 ++
 2 files changed, 4 insertions(+), 1 deletion(-)

diff --git a/bin/rabbit_fit.py b/bin/rabbit_fit.py
index a8e377a..58d7170 100755
--- a/bin/rabbit_fit.py
+++ b/bin/rabbit_fit.py
@@ -280,7 +280,8 @@ def fit(args, fitter, ws, dofit=True):
         if dofit:
             cb = fitter.minimize()
 
-            ws.add_loss_time_hist(cb.loss_history, cb.time_history)
+            if cb is not None:
+                ws.add_loss_time_hist(cb.loss_history, cb.time_history)
 
         if not args.noHessian:
             # compute the covariance matrix and estimated distance to minimum
diff --git a/rabbit/fitter.py b/rabbit/fitter.py
index a6a9605..61896e2 100644
--- a/rabbit/fitter.py
+++ b/rabbit/fitter.py
@@ -2192,6 +2192,8 @@ def minimize(self):
             del chol
 
             self.x.assign_add(dx)
+
+            callback = None
         else:
 
             def scipy_loss(xval):