diff --git a/.DS_Store b/.DS_Store new file mode 100644 index 00000000..4d78fc8f Binary files /dev/null and b/.DS_Store differ diff --git a/.gitignore b/.gitignore index 38af2255..0acbd9ee 100644 --- a/.gitignore +++ b/.gitignore @@ -14,3 +14,4 @@ issues/ abacusnbody/metadata/abacussummit_headers.asdf *-jvsc-*.ipynb *~ +abacusnbody/hod/CSMF_HOD.py diff --git a/abacusnbody/.DS_Store b/abacusnbody/.DS_Store new file mode 100644 index 00000000..810d60f9 Binary files /dev/null and b/abacusnbody/.DS_Store differ diff --git a/abacusnbody/hod/.DS_Store b/abacusnbody/hod/.DS_Store new file mode 100644 index 00000000..be3feb43 Binary files /dev/null and b/abacusnbody/hod/.DS_Store differ diff --git a/abacusnbody/hod/CSMF_HOD.py b/abacusnbody/hod/CSMF_HOD.py new file mode 100644 index 00000000..a20777c8 --- /dev/null +++ b/abacusnbody/hod/CSMF_HOD.py @@ -0,0 +1,1338 @@ +import math +import os +import time +import warnings + +import numba +import numba as nb +import numpy as np +from astropy.io import ascii +from astropy.table import Table +from numba import njit, types +from numba.typed import Dict + +# import yaml +# config = yaml.safe_load(open('config/abacus_hod.yaml')) +# numba.set_num_threads(16) +float_array = types.float64[:] +int_array = types.int64[:] +G = 4.302e-6 # in kpc/Msol (km.s)^2 + + +@njit(fastmath=True) +def n_cen_CSMF(M_h, Mstar_low, Mstar_up, M_1, M_0, gamma1, gamma2, sigma_c): + """ + Standard Cacciato et al. (2008) centrals HOD parametrization for CSMF + """ + M_c_value = M_c(M_h, M_1, M_0, gamma1, gamma2) + x_low = np.log10(Mstar_low / M_c_value) / (1.41421356 * sigma_c) + x_up = np.log10(Mstar_up / M_c_value) / (1.41421356 * sigma_c) + + return 0.5 * (math.erf(x_up) - math.erf(x_low)) + + +@njit(fastmath=True) +def CSMF_centrals(M_h, Mstar, M_1, M_0, gamma1, gamma2, sigma_c): + """ + Eq. (34) from Cacciato et al. (2008) + """ + + M_c_value = M_c(M_h, M_1, M_0, gamma1, gamma2) + + return ( + 1 + / (1.41421356 * np.sqrt(np.pi) * np.log(10) * sigma_c * Mstar) + * np.exp(-((np.log10(Mstar) - np.log10(M_c_value)) ** 2) / (2 * sigma_c**2)) + ) + + +@njit(fastmath=True) +def M_c(M_h, M_1, M_0, gamma1, gamma2): + """ + Eq. (37) from Cacciato et al. 
(2008) + """ + return M_0 * (M_h / M_1) ** gamma1 / (1 + M_h / M_1) ** (gamma1 - gamma2) + + +@njit(fastmath=True) +def get_random_cen_stellarmass( + M_h, Mstar_low, Mstar_up, M_1, M_0, gamma1, gamma2, sigma_c +): + nbins = 1000 + stellarmass = np.logspace(np.log10(Mstar_low), np.log10(Mstar_up), nbins) + stellarmass_centers = stellarmass[1:] / 2 + stellarmass[:-1] / 2 + delta_stellar_masses = stellarmass[1:] - stellarmass[:-1] + + CSMF_cen = CSMF_centrals( + M_h, stellarmass_centers, M_1, M_0, gamma1, gamma2, sigma_c + ) + + cdf = np.cumsum(CSMF_cen * delta_stellar_masses) + cdf = cdf / cdf[-1] + + random_rv = np.random.uniform(cdf.min(), cdf.max()) + bin_clostest = (np.abs(cdf - random_rv)).argmin() + + return np.random.uniform(stellarmass[bin_clostest], stellarmass[bin_clostest + 1]) + + +@njit(fastmath=True) +def get_random_cen_stellarmass_linearinterpolation( + M_h, Mstar_low, Mstar_up, M_1, M_0, gamma1, gamma2, sigma_c +): + nbins = 1000 + stellarmass = np.logspace(np.log10(Mstar_low), np.log10(Mstar_up), nbins) + # stellarmass_centers = stellarmass[1:]/2+stellarmass[:-1]/2 + delta_stellar_masses = stellarmass[1:] - stellarmass[:-1] + + CSMF_cen = CSMF_centrals(M_h, stellarmass, M_1, M_0, gamma1, gamma2, sigma_c) + + cdf = np.cumsum(CSMF_cen[:-1] * delta_stellar_masses) + cdf = cdf / cdf[-1] + + random_rv = np.random.uniform(cdf.min(), cdf.max()) + bin = np.where(cdf > random_rv)[0][0] + + m = (stellarmass[bin] - stellarmass[bin - 1]) / (cdf[bin] - cdf[bin - 1]) + return m * (random_rv - cdf[bin - 1]) + stellarmass[bin - 1] + + +@njit(fastmath=True) +def n_sat_CSMF( + M_h, + Mstar_low, + Mstar_up, + M_1, + M_0, + gamma1, + gamma2, + sigma_c, + a1, + a2, + M2, + b0, + b1, + b2, + delta1, + delta2, +): + """ + Standard Cacciato et al. (2008) satellite HOD parametrization for CSMF + """ + nbins = 1000 + stellarmass = np.logspace(np.log10(Mstar_low), np.log10(Mstar_up), nbins) + + CSMF_sat = CSMF_satelites( + M_h, + stellarmass, + M_1, + M_0, + gamma1, + gamma2, + a1, + a2, + M2, + b0, + b1, + b2, + delta1, + delta2, + ) + + nsat = 0 + for i in range(nbins - 1): + nsat += (CSMF_sat[i + 1] - CSMF_sat[i]) * ( + stellarmass[i + 1] - stellarmass[i] + ) / 2 + (stellarmass[i + 1] - stellarmass[i]) * CSMF_sat[i] + + return nsat # *ncen + + +@njit(fastmath=True) +def CSMF_satelites( + M_h, Mstar, M_1, M_0, gamma1, gamma2, a1, a2, M2, b0, b1, b2, delta1, delta2 +): + """ + Eq. (36) from Cacciato et al. (2008) + """ + M_s_value = M_s(M_h, M_1, M_0, gamma1, gamma2) + alpha_s_value = alpha_s(M_h, a1, a2, M2) + phi_s_value = phi_s(M_h, b0, b1, b2) + + delta = 10 ** (delta1 + delta2 * (np.log10(M_h) - 12)) + + return ( + phi_s_value + / M_s_value + * (Mstar / M_s_value) ** alpha_s_value + * np.exp(-delta * (Mstar / M_s_value) ** 2) + ) + + +@njit(fastmath=True) +def M_s(M_h, M_1, M_0, gamma1, gamma2): + """ + Eq. (38) from Cacciato et al. (2008) + """ + return 0.562 * M_c(M_h, M_1, M_0, gamma1, gamma2) + + +@njit(fastmath=True) +def alpha_s(M_h, a1, a2, M2): + """ + Eq. (39) from Cacciato et al. (2008) + """ + return -2.0 + a1 * (1 - 2 / np.pi * np.arctan(a2 * np.log10(M_h / M2))) + + +@njit(fastmath=True) +def phi_s(M_h, b0, b1, b2): + """ + Eq. (40) from Cacciato et al. 
(2008) + """ + M12 = M_h / 1e12 + log_phi_s = b0 + b1 * np.log10(M12) + b2 * np.log10(M12) ** 2 + return 10**log_phi_s + + +@njit(fastmath=True) +def get_random_sat_stellarmass( + M_h, + Mstar_low, + Mstar_up, + M_1, + M_0, + gamma1, + gamma2, + a1, + a2, + M2, + b0, + b1, + b2, + delta1, + delta2, +): + nbins = 1000 + stellarmass = np.logspace(np.log10(Mstar_low), np.log10(Mstar_up), nbins) + stellarmass_centers = stellarmass[1:] / 2 + stellarmass[:-1] / 2 + delta_stellar_masses = stellarmass[1:] - stellarmass[:-1] + + CSMF_sat = CSMF_satelites( + M_h, + stellarmass_centers, + M_1, + M_0, + gamma1, + gamma2, + a1, + a2, + M2, + b0, + b1, + b2, + delta1, + delta2, + ) + + cdf = np.cumsum(CSMF_sat * delta_stellar_masses) + cdf = cdf / cdf[-1] + + random_rv = np.random.uniform(cdf.min(), cdf.max()) + bin_clostest = (np.abs(cdf - random_rv)).argmin() + + return np.random.uniform(stellarmass[bin_clostest], stellarmass[bin_clostest + 1]) + + +@njit(fastmath=True) +def get_random_sat_stellarmass_linearinterpolation( + M_h, + Mstar_low, + Mstar_up, + M_1, + M_0, + gamma1, + gamma2, + a1, + a2, + M2, + b0, + b1, + b2, + delta1, + delta2, +): + nbins = 100 + stellarmass = np.logspace(np.log10(Mstar_low), np.log10(Mstar_up), nbins) + # stellarmass_centers = stellarmass[1:]/2+stellarmass[:-1]/2 + delta_stellar_masses = stellarmass[1:] - stellarmass[:-1] + + CSMF_sat = CSMF_satelites( + M_h, + stellarmass, + M_1, + M_0, + gamma1, + gamma2, + a1, + a2, + M2, + b0, + b1, + b2, + delta1, + delta2, + ) + + cdf = np.cumsum(CSMF_sat[:-1] * delta_stellar_masses) + cdf = cdf / cdf[-1] + + random_rv = np.random.uniform(cdf.min(), cdf.max()) + bin = np.where(cdf > random_rv)[0][0] + + m = (stellarmass[bin] - stellarmass[bin - 1]) / (cdf[bin] - cdf[bin - 1]) + return m * (random_rv - cdf[bin - 1]) + stellarmass[bin - 1] + + +@njit(fastmath=True) +def Gaussian_fun(x, mean, sigma): + """ + Gaussian function with centered at `mean' with standard deviation `sigma'. + """ + return 0.3989422804014327 / sigma * np.exp(-((x - mean) ** 2) / 2 / sigma**2) + + +@njit(fastmath=True) +def wrap(x, L): + """Fast scalar mod implementation""" + L2 = L / 2 + if x >= L2: + return x - L + elif x < -L2: + return x + L + return x + + +@njit(parallel=True, fastmath=True) +def gen_cent( + pos, + vel, + mass, + ids, + multis, + randoms, + vdev, + deltac, + fenv, + shear, + CSMF_hod_dict, + rsd, + inv_velz2kms, + lbox, + want_CSMF, + Nthread, + origin, +): + """ + Generate central galaxies in place in memory with a two pass numba parallel implementation. 
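+
+    Returns numba typed Dicts holding the central positions, velocities, halo
+    mass, stellar mass and halo ids, together with the ``keep`` mask flagging
+    which halos host a central (passed on to the satellite generator).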
+ """ + if want_CSMF: + Mstar_low_C, Mstar_up_C, M_1_C, M_0_C, gamma1_C, gamma2_C, sigma_c_C = ( + CSMF_hod_dict['Mstar_low'], + CSMF_hod_dict['Mstar_up'], + CSMF_hod_dict['M_1'], + CSMF_hod_dict['M_0'], + CSMF_hod_dict['gamma_1'], + CSMF_hod_dict['gamma_2'], + CSMF_hod_dict['sigma_c'], + ) + ic_C, alpha_c_C, Ac_C, Bc_C = ( + CSMF_hod_dict['ic'], + CSMF_hod_dict['alpha_c'], + CSMF_hod_dict['Acent'], + CSMF_hod_dict['Bcent'], + ) + + H = len(mass) + + numba.set_num_threads(Nthread) + Nout = np.zeros((Nthread, 1, 8), dtype=np.int64) + hstart = np.rint(np.linspace(0, H, Nthread + 1)).astype( + np.int64 + ) # starting index of each thread + + keep = np.empty(H, dtype=np.int8) # mask array tracking which halos to keep + + # figuring out the number of halos kept for each thread + for tid in numba.prange(Nthread): + for i in range(hstart[tid], hstart[tid + 1]): + # first create the markers between 0 and 1 for different tracers + CSMF_marker = 0 + if want_CSMF: + M_1_C_temp = 10 ** (np.log10(M_1_C) + Ac_C * deltac[i] + Bc_C * fenv[i]) + + ncen = n_cen_CSMF( + mass[i], + Mstar_low_C, + Mstar_up_C, + M_1_C_temp, + M_0_C, + gamma1_C, + gamma2_C, + sigma_c_C, + ) + + CSMF_marker += ncen * ic_C * multis[i] + + if randoms[i] <= CSMF_marker: + Nout[tid, 0, 0] += 1 # counting + keep[i] = 1 + else: + keep[i] = 0 + + # compose galaxy array, first create array of galaxy starting indices for the threads + gstart = np.empty((Nthread + 1, 1), dtype=np.int64) + gstart[0, :] = 0 + gstart[1:, 0] = Nout[:, 0, 0].cumsum() + + # galaxy arrays + N_CSMF = gstart[-1, 0] + CSMF_x = np.empty(N_CSMF, dtype=mass.dtype) + CSMF_y = np.empty(N_CSMF, dtype=mass.dtype) + CSMF_z = np.empty(N_CSMF, dtype=mass.dtype) + CSMF_vx = np.empty(N_CSMF, dtype=mass.dtype) + CSMF_vy = np.empty(N_CSMF, dtype=mass.dtype) + CSMF_vz = np.empty(N_CSMF, dtype=mass.dtype) + CSMF_mass = np.empty(N_CSMF, dtype=mass.dtype) + CSMF_stellarmass = np.empty(N_CSMF, dtype=mass.dtype) + CSMF_id = np.empty(N_CSMF, dtype=ids.dtype) + + # fill in the galaxy arrays + for tid in numba.prange(Nthread): + j1 = gstart[tid] + for i in range(hstart[tid], hstart[tid + 1]): + if keep[i] == 1: + # loop thru three directions to assign galaxy velocities and positions + CSMF_x[j1] = pos[i, 0] + CSMF_vx[j1] = vel[i, 0] + alpha_c_C * vdev[i, 0] # velocity bias + CSMF_y[j1] = pos[i, 1] + CSMF_vy[j1] = vel[i, 1] + alpha_c_C * vdev[i, 1] # velocity bias + CSMF_z[j1] = pos[i, 2] + CSMF_vz[j1] = vel[i, 2] + alpha_c_C * vdev[i, 2] # velocity bias + + # rsd only applies to the z direction + if rsd and origin is not None: + nx = CSMF_x[j1] - origin[0] + ny = CSMF_y[j1] - origin[1] + nz = CSMF_z[j1] - origin[2] + inv_norm = 1.0 / np.sqrt(nx * nx + ny * ny + nz * nz) + nx *= inv_norm + ny *= inv_norm + nz *= inv_norm + proj = inv_velz2kms * ( + CSMF_vx[j1] * nx + CSMF_vy[j1] * ny + CSMF_vz[j1] * nz + ) + CSMF_x[j1] = CSMF_x[j1] + proj * nx + CSMF_y[j1] = CSMF_y[j1] + proj * ny + CSMF_z[j1] = CSMF_z[j1] + proj * nz + elif rsd: + CSMF_z[j1] = wrap(pos[i, 2] + CSMF_vz[j1] * inv_velz2kms, lbox) + + CSMF_mass[j1] = mass[i] + M_1_C_temp = 10 ** (np.log10(M_1_C) + Ac_C * deltac[i] + Bc_C * fenv[i]) + CSMF_stellarmass[j1] = get_random_cen_stellarmass_linearinterpolation( + mass[i], + Mstar_low_C, + Mstar_up_C, + M_1_C_temp, + M_0_C, + gamma1_C, + gamma2_C, + sigma_c_C, + ) + CSMF_id[j1] = ids[i] + j1 += 1 + # assert j == gstart[tid + 1] + + CSMF_dict = Dict.empty(key_type=types.unicode_type, value_type=float_array) + ID_dict = Dict.empty(key_type=types.unicode_type, value_type=int_array) + + 
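+    # Pack the outputs into numba typed Dicts keyed by column name; the value
+    # types are the float64[:] / int64[:] signatures declared at module level.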
CSMF_dict['x'] = CSMF_x + CSMF_dict['y'] = CSMF_y + CSMF_dict['z'] = CSMF_z + CSMF_dict['vx'] = CSMF_vx + CSMF_dict['vy'] = CSMF_vy + CSMF_dict['vz'] = CSMF_vz + CSMF_dict['mass'] = CSMF_mass + CSMF_dict['stellarmass'] = CSMF_stellarmass + ID_dict['CSMF'] = CSMF_id + return CSMF_dict, ID_dict, keep + + +@njit(parallel=True, fastmath=True) +def getPointsOnSphere(nPoints, Nthread, seed=None): + """ + --- Aiding function for NFW computation, generate random points in a sphere + """ + numba.set_num_threads(Nthread) + ind = min(Nthread, nPoints) + # starting index of each thread + hstart = np.rint(np.linspace(0, nPoints, ind + 1)) + ur = np.zeros((nPoints, 3), dtype=np.float64) + cmin = -1 + cmax = +1 + + for tid in numba.prange(Nthread): + if seed is not None: + np.random.seed(seed[tid]) + for i in range(hstart[tid], hstart[tid + 1]): + u1, u2 = np.random.uniform(0, 1), np.random.uniform(0, 1) + ra = 0 + u1 * (2 * np.pi - 0) + dec = np.pi - (np.arccos(cmin + u2 * (cmax - cmin))) + + ur[i, 0] = np.sin(dec) * np.cos(ra) + ur[i, 1] = np.sin(dec) * np.sin(ra) + ur[i, 2] = np.cos(dec) + return ur + + +@njit(fastmath=True, parallel=True) # parallel=True, +def compute_fast_NFW( + NFW_draw, + h_id, + x_h, + y_h, + z_h, + vx_h, + vy_h, + vz_h, + vrms_h, + c, + M, + Rvir, + rd_pos, + num_sat, + f_sigv, + vel_sat='rd_normal', + Nthread=16, + exp_frac=0, + exp_scale=1, + nfw_rescale=1, +): + """ + --- Compute NFW positions and velocities for satelitte galaxies + c: r98/r25 + vrms_h: 'sigmav3d_L2com' + """ + # numba.set_num_threads(Nthread) + # figuring out the number of halos kept for each thread + h_id = np.repeat(h_id, num_sat) + M = np.repeat(M, num_sat) + c = np.repeat(c, num_sat) + Rvir = np.repeat(Rvir, num_sat) + x_h = np.repeat(x_h, num_sat) + y_h = np.repeat(y_h, num_sat) + z_h = np.repeat(z_h, num_sat) + vx_h = np.repeat(vx_h, num_sat) + vy_h = np.repeat(vy_h, num_sat) + vz_h = np.repeat(vz_h, num_sat) + vrms_h = np.repeat(vrms_h, num_sat) + x_sat = np.empty_like(x_h) + y_sat = np.empty_like(y_h) + z_sat = np.empty_like(z_h) + vx_sat = np.empty_like(vx_h) + vy_sat = np.empty_like(vy_h) + vz_sat = np.empty_like(vz_h) + + # starting index of each thread + hstart = np.rint(np.linspace(0, num_sat.sum(), Nthread + 1)) + for tid in numba.prange(Nthread): + for i in range(int(hstart[tid]), int(hstart[tid + 1])): + ind = i + # while (NFW_draw[ind] > c[i]): + # ind = np.random.randint(0, len(NFW_draw)) + # etaVir = NFW_draw[ind]/c[i] # =r/rvir + if np.random.uniform(0, 1) < exp_frac: + tt = np.random.exponential(exp_scale, size=1)[0] + etaVir = tt / c[i] + else: + while NFW_draw[ind] > c[i]: + ind = np.random.randint(0, len(NFW_draw)) + etaVir = NFW_draw[ind] / c[i] * nfw_rescale + + p = etaVir * Rvir[i] + x_sat[i] = x_h[i] + rd_pos[i, 0] * p + y_sat[i] = y_h[i] + rd_pos[i, 1] * p + z_sat[i] = z_h[i] + rd_pos[i, 2] * p + if vel_sat == 'rd_normal': + sig = vrms_h[i] * 0.577 * f_sigv + vx_sat[i] = np.random.normal(loc=vx_h[i], scale=sig) + vy_sat[i] = np.random.normal(loc=vy_h[i], scale=sig) + vz_sat[i] = np.random.normal(loc=vz_h[i], scale=sig) + else: + raise ValueError('Wrong vel_sat argument only "rd_normal"') + return h_id, x_sat, y_sat, z_sat, vx_sat, vy_sat, vz_sat, M + + +@njit(fastmath=True, parallel=True) +def gen_sats_nfw( + NFW_draw, + hpos, + hvel, + hmass, + hid, + hdeltac, + hfenv, + hshear, + hvrms, + hc, + hrvir, + CSMF_hod_dict, + want_CSMF, + rsd, + inv_velz2kms, + lbox, + keep_cent, + vel_sat='rd_normal', + Nthread=16, +): + """ + Generate satellite galaxies on an NFW profile, with 
option for an extended profile. See Rocher et al. 2023. + + Not yet on lightcone!! Different velocity bias treatment!! Not built for performance!! + + """ + if want_CSMF: + ( + Mstar_low_C, + Mstar_up_C, + M_1_C, + M_0_C, + gamma1_C, + gamma2_C, + sigma_c_C, + a1_C, + a2_C, + M2_C, + b0_C, + b1_C, + b2_C, + delta1_C, + delta2_C, + ) = ( + CSMF_hod_dict['Mstar_low'], + CSMF_hod_dict['Mstar_up'], + CSMF_hod_dict['M_1'], + CSMF_hod_dict['M_0'], + CSMF_hod_dict['gamma_1'], + CSMF_hod_dict['gamma_2'], + CSMF_hod_dict['sigma_c'], + CSMF_hod_dict['a_1'], + CSMF_hod_dict['a_2'], + CSMF_hod_dict['M_2'], + CSMF_hod_dict['b_0'], + CSMF_hod_dict['b_1'], + CSMF_hod_dict['b_2'], + CSMF_hod_dict['delta_1'], + CSMF_hod_dict['delta_2'], + ) + Ac_C, As_C, Bc_C, Bs_C, ic_C = ( + CSMF_hod_dict['Acent'], + CSMF_hod_dict['Asat'], + CSMF_hod_dict['Bcent'], + CSMF_hod_dict['Bsat'], + CSMF_hod_dict['ic'], + ) + f_sigv_C = CSMF_hod_dict['f_sigv'] + + numba.set_num_threads(Nthread) + + # compute nsate for each halo + # figuring out the number of particles kept for each thread + num_sats_C = np.zeros(len(hid), dtype=np.int64) + stellarmass_C = np.zeros(len(hid), dtype=np.int64) + hstart = np.rint(np.linspace(0, len(hid), Nthread + 1)).astype( + np.int64 + ) # starting index of each thread + for tid in range(Nthread): + for i in range(hstart[tid], hstart[tid + 1]): + if want_CSMF: + M_1_C_temp = 10 ** ( + np.log10(M_1_C) + Ac_C * hdeltac[i] + Bc_C * hfenv[i] + ) + a1_C_temp = a1_C + As_C * hdeltac[i] + Bs_C * hfenv[i] + base_p_C = ( + n_sat_CSMF( + hmass[i], + Mstar_low_C, + Mstar_up_C, + M_1_C_temp, + M_0_C, + gamma1_C, + gamma2_C, + sigma_c_C, + a1_C_temp, + a2_C, + M2_C, + b0_C, + b1_C, + b2_C, + delta1_C, + delta2_C, + ) + * ic_C + ) + num_sats_C[i] = np.random.poisson(base_p_C) + + # generate rdpos + rd_pos_C = getPointsOnSphere(np.sum(num_sats_C), Nthread) + + # put satellites on NFW + h_id_C, x_sat_C, y_sat_C, z_sat_C, vx_sat_C, vy_sat_C, vz_sat_C, M_C = ( + compute_fast_NFW( + NFW_draw, + hid, + hpos[:, 0], + hpos[:, 1], + hpos[:, 2], + hvel[:, 0], + hvel[:, 1], + hvel[:, 2], + hvrms, + hc, + hmass, + hrvir, + rd_pos_C, + num_sats_C, + f_sigv_C, + vel_sat, + Nthread, + ) + ) + + # do rsd + if rsd: + z_sat_C = (z_sat_C + vz_sat_C * inv_velz2kms) % lbox + + CSMF_dict = Dict.empty(key_type=types.unicode_type, value_type=float_array) + ID_dict = Dict.empty(key_type=types.unicode_type, value_type=int_array) + + CSMF_dict['x'] = x_sat_C + CSMF_dict['y'] = y_sat_C + CSMF_dict['z'] = z_sat_C + CSMF_dict['vx'] = vx_sat_C + CSMF_dict['vy'] = vy_sat_C + CSMF_dict['vz'] = vz_sat_C + CSMF_dict['mass'] = M_C + stellarmass_C = np.empty_like(M_C) + ## compute stellarmass of all the satelites + if want_CSMF: + hstart = np.rint(np.linspace(0, num_sats_C.sum(), Nthread + 1)) + for tid in numba.prange(Nthread): + for i in range(int(hstart[tid]), int(hstart[tid + 1])): + M_1_C_temp = 10 ** ( + np.log10(M_1_C) + Ac_C * hdeltac[i] + Bc_C * hfenv[i] + ) + a1_C_temp = a1_C + As_C * hdeltac[i] + Bs_C * hfenv[i] + stellarmass_C[i] = get_random_sat_stellarmass_linearinterpolation( + M_C[i], + Mstar_low_C, + Mstar_up_C, + M_1_C_temp, + M_0_C, + gamma1_C, + gamma2_C, + a1_C_temp, + a2_C, + M2_C, + b0_C, + b1_C, + b2_C, + delta1_C, + delta2_C, + ) + + CSMF_dict['stellarmass'] = stellarmass_C + ID_dict['CSMF'] = h_id_C + + return CSMF_dict, ID_dict + + +@njit(parallel=True, fastmath=True) +def gen_sats( + ppos, + pvel, + hvel, + hmass, + hid, + weights, + randoms, + hdeltac, + hfenv, + hshear, + enable_ranks, + ranks, + ranksv, + ranksp, + 
ranksr, + ranksc, + CSMF_hod_dict, + rsd, + inv_velz2kms, + lbox, + Mpart, + want_CSMF, + Nthread, + origin, + keep_cent, +): + """ + Generate satellite galaxies in place in memory with a two pass numba parallel implementation. + """ + + if want_CSMF: + ( + Mstar_low_C, + Mstar_up_C, + M_1_C, + M_0_C, + gamma1_C, + gamma2_C, + sigma_c_C, + a1_C, + a2_C, + M2_C, + b0_C, + b1_C, + b2_C, + delta1_C, + delta2_C, + ) = ( + CSMF_hod_dict['Mstar_low'], + CSMF_hod_dict['Mstar_up'], + CSMF_hod_dict['M_1'], + CSMF_hod_dict['M_0'], + CSMF_hod_dict['gamma_1'], + CSMF_hod_dict['gamma_2'], + CSMF_hod_dict['sigma_c'], + CSMF_hod_dict['a_1'], + CSMF_hod_dict['a_2'], + CSMF_hod_dict['M_2'], + CSMF_hod_dict['b_0'], + CSMF_hod_dict['b_1'], + CSMF_hod_dict['b_2'], + CSMF_hod_dict['delta_1'], + CSMF_hod_dict['delta_2'], + ) + + alpha_s_C, s_C, s_v_C, s_p_C, s_r_C, Ac_C, As_C, Bc_C, Bs_C, ic_C = ( + CSMF_hod_dict['alpha_s'], + CSMF_hod_dict['s'], + CSMF_hod_dict['s_v'], + CSMF_hod_dict['s_p'], + CSMF_hod_dict['s_r'], + CSMF_hod_dict['Acent'], + CSMF_hod_dict['Asat'], + CSMF_hod_dict['Bcent'], + CSMF_hod_dict['Bsat'], + CSMF_hod_dict['ic'], + ) + + H = len(hmass) # num of particles + + numba.set_num_threads(Nthread) + Nout = np.zeros((Nthread, 1, 8), dtype=np.int64) + hstart = np.rint(np.linspace(0, H, Nthread + 1)).astype( + np.int64 + ) # starting index of each thread + + keep = np.empty(H, dtype=np.int8) # mask array tracking which halos to keep + + # figuring out the number of particles kept for each thread + for tid in numba.prange(Nthread): # numba.prange(Nthread): + for i in range(hstart[tid], hstart[tid + 1]): + # print(logM1, As, hdeltac[i], Bs, hfenv[i]) + CSMF_marker = 0 + if want_CSMF: + M_1_C_temp = 10 ** ( + np.log10(M_1_C) + Ac_C * hdeltac[i] + Bc_C * hfenv[i] + ) + a1_C_temp = a1_C + As_C * hdeltac[i] + Bs_C * hfenv[i] + base_p_C = ( + n_sat_CSMF( + hmass[i], + Mstar_low_C, + Mstar_up_C, + M_1_C_temp, + M_0_C, + gamma1_C, + gamma2_C, + sigma_c_C, + a1_C_temp, + a2_C, + M2_C, + b0_C, + b1_C, + b2_C, + delta1_C, + delta2_C, + ) + * weights[i] + * ic_C + ) + if enable_ranks: + decorator_C = ( + 1 + + s_C * ranks[i] + + s_v_C * ranksv[i] + + s_p_C * ranksp[i] + + s_r_C * ranksr[i] + ) + exp_sat = base_p_C * decorator_C + else: + exp_sat = base_p_C + CSMF_marker += exp_sat + + if randoms[i] <= CSMF_marker: + Nout[tid, 0, 0] += 1 # counting + keep[i] = 1 + else: + keep[i] = 0 + + # compose galaxy array, first create array of galaxy starting indices for the threads + gstart = np.empty((Nthread + 1, 1), dtype=np.int64) + gstart[0, :] = 0 + gstart[1:, 0] = Nout[:, 0, 0].cumsum() + + # galaxy arrays + N_CSMF = gstart[-1, 0] + CSMF_x = np.empty(N_CSMF, dtype=hmass.dtype) + CSMF_y = np.empty(N_CSMF, dtype=hmass.dtype) + CSMF_z = np.empty(N_CSMF, dtype=hmass.dtype) + CSMF_vx = np.empty(N_CSMF, dtype=hmass.dtype) + CSMF_vy = np.empty(N_CSMF, dtype=hmass.dtype) + CSMF_vz = np.empty(N_CSMF, dtype=hmass.dtype) + CSMF_mass = np.empty(N_CSMF, dtype=hmass.dtype) + CSMF_stellarmass = np.empty(N_CSMF, dtype=hmass.dtype) + CSMF_id = np.empty(N_CSMF, dtype=hid.dtype) + + # fill in the galaxy arrays + for tid in numba.prange(Nthread): + j1 = gstart[tid] + for i in range(hstart[tid], hstart[tid + 1]): + if keep[i] == 1: + CSMF_x[j1] = ppos[i, 0] + CSMF_vx[j1] = hvel[i, 0] + alpha_s_C * ( + pvel[i, 0] - hvel[i, 0] + ) # velocity bias + CSMF_y[j1] = ppos[i, 1] + CSMF_vy[j1] = hvel[i, 1] + alpha_s_C * ( + pvel[i, 1] - hvel[i, 1] + ) # velocity bias + CSMF_z[j1] = ppos[i, 2] + CSMF_vz[j1] = hvel[i, 2] + alpha_s_C * ( + 
pvel[i, 2] - hvel[i, 2] + ) # velocity bias + if rsd and origin is not None: + nx = CSMF_x[j1] - origin[0] + ny = CSMF_y[j1] - origin[1] + nz = CSMF_z[j1] - origin[2] + inv_norm = 1.0 / np.sqrt(nx * nx + ny * ny + nz * nz) + nx *= inv_norm + ny *= inv_norm + nz *= inv_norm + proj = inv_velz2kms * ( + CSMF_vx[j1] * nx + CSMF_vy[j1] * ny + CSMF_vz[j1] * nz + ) + CSMF_x[j1] = CSMF_x[j1] + proj * nx + CSMF_y[j1] = CSMF_y[j1] + proj * ny + CSMF_z[j1] = CSMF_z[j1] + proj * nz + elif rsd: + CSMF_z[j1] = wrap(CSMF_z[j1] + CSMF_vz[j1] * inv_velz2kms, lbox) + + M_1_C_temp = 10 ** ( + np.log10(M_1_C) + Ac_C * hdeltac[i] + Bc_C * hfenv[i] + ) + a1_C_temp = a1_C + As_C * hdeltac[i] + Bs_C * hfenv[i] + CSMF_stellarmass[j1] = get_random_sat_stellarmass( + hmass[i], + Mstar_low_C, + Mstar_up_C, + M_1_C_temp, + M_0_C, + gamma1_C, + gamma2_C, + a1_C_temp, + a2_C, + M2_C, + b0_C, + b1_C, + b2_C, + delta1_C, + delta2_C, + ) + CSMF_mass[j1] = hmass[i] + CSMF_id[j1] = hid[i] + j1 += 1 + # assert j == gstart[tid + 1] + + CSMF_dict = Dict.empty(key_type=types.unicode_type, value_type=float_array) + ID_dict = Dict.empty(key_type=types.unicode_type, value_type=int_array) + + CSMF_dict['x'] = CSMF_x + CSMF_dict['y'] = CSMF_y + CSMF_dict['z'] = CSMF_z + CSMF_dict['vx'] = CSMF_vx + CSMF_dict['vy'] = CSMF_vy + CSMF_dict['vz'] = CSMF_vz + CSMF_dict['mass'] = CSMF_mass + CSMF_dict['stellarmass'] = CSMF_stellarmass + ID_dict['CSMF'] = CSMF_id + + return CSMF_dict, ID_dict + + +@njit(parallel=True, fastmath=True) +def fast_concatenate(array1, array2, Nthread): + """Fast concatenate with numba parallel""" + + N1 = len(array1) + N2 = len(array2) + if N1 == 0: + return array2 + elif N2 == 0: + return array1 + + final_array = np.empty(N1 + N2, dtype=array1.dtype) + # if one thread, then no need to parallel + if Nthread == 1: + for i in range(N1): + final_array[i] = array1[i] + for j in range(N2): + final_array[j + N1] = array2[j] + return final_array + + numba.set_num_threads(Nthread) + Nthread1 = max(1, int(np.floor(Nthread * N1 / (N1 + N2)))) + Nthread2 = Nthread - Nthread1 + hstart1 = np.rint(np.linspace(0, N1, Nthread1 + 1)).astype(np.int64) + hstart2 = np.rint(np.linspace(0, N2, Nthread2 + 1)).astype(np.int64) + N1 + + for tid in numba.prange(Nthread): # numba.prange(Nthread): + if tid < Nthread1: + for i in range(hstart1[tid], hstart1[tid + 1]): + final_array[i] = array1[i] + else: + for i in range(hstart2[tid - Nthread1], hstart2[tid + 1 - Nthread1]): + final_array[i] = array2[i - N1] + # final_array = np.concatenate((array1, array2)) + return final_array + + +def gen_gals( + halos_array, + subsample, + tracers, + params, + Nthread, + enable_ranks, + rsd, + verbose, + nfw, + NFW_draw=None, +): + """ + parse hod parameters, pass them on to central and satellite generators + and then format the results + + Parameters + ---------- + + halos_array : dictionary of arrays + a dictionary of halo properties (pos, vel, mass, id, randoms, ...) + + subsample : dictionary of arrays + a dictionary of particle propoerties (pos, vel, hmass, hid, Np, subsampling, randoms, ...) + + tracers : dictionary of dictionaries + Dictionary of multi-tracer HODs + + enable_ranks : boolean + Flag of whether to implement particle ranks. + + rsd : boolean + Flag of whether to implement RSD. + + params : dict + Dictionary of various simulation parameters. + + """ + + # B.H. 
TODO: pass as dictionary; make what's below more succinct + for tracer in tracers.keys(): + if tracer == 'CSMF': + CSMF_HOD = tracers[tracer] + + if 'CSMF' in tracers.keys(): + want_CSMF = True + + CSMF_hod_dict = nb.typed.Dict.empty( + key_type=nb.types.unicode_type, value_type=nb.types.float64 + ) + for key, value in CSMF_HOD.items(): + CSMF_hod_dict[key] = value + + CSMF_hod_dict['Acent'] = CSMF_HOD.get('Acent', 0.0) + CSMF_hod_dict['Asat'] = CSMF_HOD.get('Asat', 0.0) + CSMF_hod_dict['Bcent'] = CSMF_HOD.get('Bcent', 0.0) + CSMF_hod_dict['Bsat'] = CSMF_HOD.get('Bsat', 0.0) + CSMF_hod_dict['ic'] = CSMF_HOD.get('ic', 1.0) + CSMF_hod_dict['f_sigv'] = CSMF_HOD.get('f_sigv', 0) + + else: + want_CSMF = False + CSMF_hod_dict = nb.typed.Dict.empty( + key_type=nb.types.unicode_type, value_type=nb.types.float64 + ) + + start = time.time() + + velz2kms = params['velz2kms'] + inv_velz2kms = 1 / velz2kms + lbox = params['Lbox'] + origin = params['origin'] + + CSMF_dict_cent, ID_dict_cent, keep_cent = gen_cent( + halos_array['hpos'], + halos_array['hvel'], + halos_array['hmass'], + halos_array['hid'], + halos_array['hmultis'], + halos_array['hrandoms'], + halos_array['hveldev'], + halos_array.get('hdeltac', np.zeros(len(halos_array['hmass']))), + halos_array.get('hfenv', np.zeros(len(halos_array['hmass']))), + halos_array.get('hshear', np.zeros(len(halos_array['hmass']))), + CSMF_hod_dict, + rsd, + inv_velz2kms, + lbox, + want_CSMF, + Nthread, + origin, + ) + if verbose: + print('generating centrals took ', time.time() - start) + + start = time.time() + if nfw: + warnings.warn( + 'NFW profile is unoptimized. It has different velocity bias. It does not support lightcone.' + ) + CSMF_dict_sat, ID_dict_sat = gen_sats_nfw( + NFW_draw, + halos_array['hpos'], + halos_array['hvel'], + halos_array['hmass'], + halos_array['hid'], + halos_array.get('hdeltac', np.zeros(len(halos_array['hmass']))), + halos_array.get('hfenv', np.zeros(len(halos_array['hmass']))), + halos_array.get('hshear', np.zeros(len(halos_array['hmass']))), + halos_array['hsigma3d'], + halos_array['hc'], + halos_array['hrvir'], + CSMF_hod_dict, + want_CSMF, + rsd, + inv_velz2kms, + lbox, + keep_cent, + Nthread=Nthread, + ) + else: + CSMF_dict_sat, ID_dict_sat = gen_sats( + subsample['ppos'], + subsample['pvel'], + subsample['phvel'], + subsample['phmass'], + subsample['phid'], + subsample['pweights'], + subsample['prandoms'], + subsample.get('pdeltac', np.zeros(len(subsample['phid']))), + subsample.get('pfenv', np.zeros(len(subsample['phid']))), + subsample.get('pshear', np.zeros(len(subsample['phid']))), + enable_ranks, + subsample['pranks'], + subsample['pranksv'], + subsample['pranksp'], + subsample['pranksr'], + subsample['pranksc'], + CSMF_hod_dict, + rsd, + inv_velz2kms, + lbox, + params['Mpart'], + want_CSMF, + Nthread, + origin, + keep_cent[subsample['pinds']], + ) + if verbose: + print('generating satellites took ', time.time() - start) + + # B.H. 
TODO: need a for loop above so we don't need to do this by hand + HOD_dict_sat = {'CSMF': CSMF_dict_sat} + HOD_dict_cent = {'CSMF': CSMF_dict_cent} + + # do a concatenate in numba parallel + start = time.time() + HOD_dict = {} + for tracer in tracers: + tracer_dict = {'Ncent': len(HOD_dict_cent[tracer]['x'])} + for k in HOD_dict_cent[tracer]: + tracer_dict[k] = fast_concatenate( + HOD_dict_cent[tracer][k], HOD_dict_sat[tracer][k], Nthread + ) + tracer_dict['id'] = fast_concatenate( + ID_dict_cent[tracer], ID_dict_sat[tracer], Nthread + ) + if verbose: + print(tracer, 'number of galaxies ', len(tracer_dict['x'])) + print( + 'satellite fraction ', + len(HOD_dict_sat[tracer]['x']) / len(tracer_dict['x']), + ) + HOD_dict[tracer] = tracer_dict + if verbose: + print('organizing outputs took ', time.time() - start) + return HOD_dict + + +def gen_gal_cat_CSMF( + halo_data, + particle_data, + tracers, + params, + Nthread=16, + enable_ranks=False, + rsd=True, + nfw=False, + NFW_draw=None, + write_to_disk=False, + savedir='./', + verbose=False, + fn_ext=None, +): + """ + pass on inputs to the gen_gals function and takes care of I/O + + Parameters + ---------- + + halos_data : dictionary of arrays + a dictionary of halo properties (pos, vel, mass, id, randoms, ...) + + particle_data : dictionary of arrays + a dictionary of particle propoerties (pos, vel, hmass, hid, Np, subsampling, randoms, ...) + + tracers : dictionary of dictionaries + Dictionary of multi-tracer HODs + + enable_ranks : boolean + Flag of whether to implement particle ranks. + + rsd : boolean + Flag of whether to implement RSD. + + nfw : boolean + Flag of whether to generate satellites from an NFW profile. + + write_to_disk : boolean + Flag of whether to output to disk. + + verbose : boolean + Whether to output detailed outputs. + + savedir : str + where to save the output if write_to_disk == True. + + params : dict + Dictionary of various simulation parameters. + + fn_ext: str + filename extension for saved files. Only relevant when ``write_to_disk = True``. 
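+
+    Nthread : int
+        Number of threads used by the numba kernels.
+
+    NFW_draw : array, optional
+        Precomputed random draws used to place satellites on the NFW profile.
+        Only relevant when ``nfw = True``.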
+ + Output + ------ + + HOD_dict : dictionary of dictionaries + Dictionary of the format: {tracer1_dict, tracer2_dict, ...}, + where tracer1_dict = {x, y, z, vx, vy, vz, mass, id} + + """ + + if not isinstance(rsd, bool): + raise ValueError('Error: rsd has to be a boolean') + + # find the halos, populate them with galaxies and write them to files + HOD_dict = gen_gals( + halo_data, + particle_data, + tracers, + params, + Nthread, + enable_ranks, + rsd, + verbose, + nfw, + NFW_draw, + ) + + # how many galaxies were generated and write them to disk + for tracer in tracers.keys(): + Ncent = HOD_dict[tracer]['Ncent'] + if verbose: + print( + 'generated %ss:' % tracer, + len(HOD_dict[tracer]['x']), + 'satellite fraction ', + 1 - Ncent / len(HOD_dict[tracer]['x']), + ) + + if write_to_disk: + if verbose: + print('outputting galaxies to disk') + + if rsd: + rsd_string = '_rsd' + else: + rsd_string = '' + + if fn_ext is None: + outdir = (savedir) / ('galaxies' + rsd_string) + else: + outdir = (savedir) / ('galaxies' + rsd_string + fn_ext) + + # create directories if not existing + os.makedirs(outdir, exist_ok=True) + + # save to file + # outdict = + HOD_dict[tracer].pop('Ncent', None) + table = Table( + HOD_dict[tracer], + meta={'Ncent': Ncent, 'Gal_type': tracer, **tracers[tracer]}, + ) + if params['chunk'] == -1: + ascii.write( + table, outdir / (f'{tracer}s.dat'), overwrite=True, format='ecsv' + ) + else: + ascii.write( + table, + outdir / (f"{tracer}s_chunk{params['chunk']:d}.dat"), + overwrite=True, + format='ecsv', + ) + + return HOD_dict diff --git a/abacusnbody/hod/abacus_hod.py b/abacusnbody/hod/abacus_hod.py index de49a210..feabe014 100644 --- a/abacusnbody/hod/abacus_hod.py +++ b/abacusnbody/hod/abacus_hod.py @@ -35,6 +35,13 @@ N_sat_generic, ) +from .CSMF_HOD import ( + gen_gal_cat_CSMF, + n_cen_CSMF, + n_sat_CSMF, +) + + # TODO B.H.: staging can be shorter and prettier; perhaps asdf for h5 and ecsv? 
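For reference, the CSMF code path above expects the `CSMF` entry of `tracers` to carry the Cacciato et al. (2008) parameters used throughout `CSMF_HOD.py`. A minimal sketch of that dictionary is given below; the key names follow the code, but the numerical values are illustrative placeholders rather than a calibrated set.

    # Illustrative 'CSMF' tracer dictionary (placeholder values, not a fit)
    CSMF_params = {
        'Mstar_low': 10**9.5, 'Mstar_up': 10**12.0,       # stellar-mass range sampled
        'M_1': 10**11.5, 'M_0': 10**10.0,                 # M_c(M_h), Eq. (37)
        'gamma_1': 3.0, 'gamma_2': 0.3, 'sigma_c': 0.15,  # central CSMF shape and scatter
        'a_1': 0.8, 'a_2': 1.0, 'M_2': 10**11.8,          # satellite slope, Eq. (39)
        'b_0': -0.5, 'b_1': 1.0, 'b_2': -0.2,             # satellite normalisation, Eq. (40)
        'delta_1': 0.0, 'delta_2': 0.0,                   # high-mass cut-off in Eq. (36)
        'alpha_c': 0.0, 'alpha_s': 1.0,                   # central / satellite velocity bias
        's': 0.0, 's_v': 0.0, 's_p': 0.0, 's_r': 0.0,     # rank-based decorations
        # Acent, Asat, Bcent, Bsat default to 0, ic to 1 and f_sigv to 0 in gen_gals
    }

With such a block in place, `run_hod` dispatches to `gen_gal_cat_CSMF` instead of `gen_gal_cat`, as wired up in the hunks below.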
@@ -303,7 +310,7 @@ def staging(self): params['numslabs'] = end - start self.lbox = header['BoxSize'] - # count ther number of halos and particles + # count the number of halos and particles Nhalos = np.zeros(params['numslabs']) Nparts = np.zeros(params['numslabs']) for eslab in range(start, end): @@ -311,6 +318,7 @@ def staging(self): ('ELG' not in self.tracers.keys()) and ('QSO' not in self.tracers.keys()) and (not self.force_mt) + and ('CSMF' not in self.tracers.keys()) ): halofilename = subsample_dir / ( 'halos_xcom_%d_seed600_abacushod_oldfenv' % eslab @@ -391,6 +399,7 @@ def staging(self): ('ELG' not in self.tracers.keys()) and ('QSO' not in self.tracers.keys()) and (not self.force_mt) + and ('CSMF' not in self.tracers.keys()) ): halofilename = subsample_dir / ( 'halos_xcom_%d_seed600_abacushod_oldfenv' % eslab @@ -756,21 +765,39 @@ def run_hod( ) start = time.time() - mock_dict = gen_gal_cat( - self.halo_data, - self.particle_data, - tracers, - self.params, - Nthread, - enable_ranks=self.want_ranks, - rsd=want_rsd, - nfw=want_nfw, - NFW_draw=NFW_draw, - write_to_disk=write_to_disk, - savedir=self.mock_dir, - verbose=verbose, - fn_ext=fn_ext, - ) + if 'CSMF' in tracers.keys(): + mock_dict = gen_gal_cat_CSMF( + self.halo_data, + self.particle_data, + tracers, + self.params, + Nthread, + enable_ranks=self.want_ranks, + rsd=want_rsd, + nfw=want_nfw, + NFW_draw=NFW_draw, + write_to_disk=write_to_disk, + savedir=self.mock_dir, + verbose=verbose, + fn_ext=fn_ext, + ) + else: + mock_dict = gen_gal_cat( + self.halo_data, + self.particle_data, + tracers, + self.params, + Nthread, + enable_ranks=self.want_ranks, + rsd=want_rsd, + nfw=want_nfw, + NFW_draw=NFW_draw, + write_to_disk=write_to_disk, + savedir=self.mock_dir, + verbose=verbose, + fn_ext=fn_ext, + ) + self.logger.info(f'HOD generated in elapsed time {time.time() - start:.2f} s.') return mock_dict @@ -892,6 +919,37 @@ def compute_ngal(self, tracers=None, Nthread=16): ) ngal_dict[etracer] = newngal[0] + newngal[1] fsat_dict[etracer] = newngal[1] / (newngal[0] + newngal[1]) + + elif etracer == 'CSMF': + newngal = AbacusHOD._compute_ngal_CSMF( + self.logMbins, + self.deltacbins, + self.fenvbins, + self.halo_mass_func, + tracer_hod['Mstar_low'], + tracer_hod['Mstar_up'], + tracer_hod['M_1'], + tracer_hod['M_0'], + tracer_hod['gamma_1'], + tracer_hod['gamma_2'], + tracer_hod['sigma_c'], + tracer_hod['a_1'], + tracer_hod['a_2'], + tracer_hod['M_2'], + tracer_hod['b_0'], + tracer_hod['b_1'], + tracer_hod['b_2'], + tracer_hod.get('delta_1', 0), + tracer_hod.get('delta_2', 0), + tracer_hod.get('Acent', 0), + tracer_hod.get('Asat', 0), + tracer_hod.get('Bcent', 0), + tracer_hod.get('Bsat', 0), + tracer_hod.get('ic', 1), + Nthread, + ) + ngal_dict[etracer] = newngal[0] + newngal[1] + fsat_dict[etracer] = newngal[1] / (newngal[0] + newngal[1]) return ngal_dict, fsat_dict @staticmethod @@ -1095,6 +1153,90 @@ def _compute_ngal_qso( ngal_sat += halo_mass_func[i, j, k] * nsat_temp * ic return ngal_cent, ngal_sat + @staticmethod + @njit(fastmath=True, parallel=True) + def _compute_ngal_CSMF( + logMbins, + deltacbins, + fenvbins, + halo_mass_func, + Mstar_low, + Mstar_up, + M_1, + M_0, + gamma1, + gamma2, + sigma_c, + a1, + a2, + M2, + b0, + b1, + b2, + delta1, + delta2, + Acent, + Asat, + Bcent, + Bsat, + ic, + Nthread, + ): + """ + internal helper to compute number of CSMFs + """ + numba.set_num_threads(Nthread) + + logMs = 0.5 * (logMbins[1:] + logMbins[:-1]) + # deltacs = 0.5 * (deltacbins[1:] + deltacbins[:-1]) + # fenvs = 0.5 * (fenvbins[1:] + 
fenvbins[:-1]) + ngal_cent = 0 + ngal_sat = 0 + + for i in numba.prange(len(logMbins) - 1): + for j in range(len(deltacbins) - 1): + for k in range(len(fenvbins) - 1): + Mh_temp = 10 ** logMs[i] + M_1_temp = 10 ** ( + np.log10(M_1) + ) # + Acent * deltacs[j] + Bcent * fenvs[k]) + M2_temp = 10 ** ( + np.log10(M2) + ) # + Asat * deltacs[j] + Bsat * fenvs[k]) + + ncent_temp = n_cen_CSMF( + Mh_temp, + Mstar_low, + Mstar_up, + M_1_temp, + M_0, + gamma1, + gamma2, + sigma_c, + ) + nsat_temp = n_sat_CSMF( + Mh_temp, + Mstar_low, + Mstar_up, + M_1_temp, + M_0, + gamma1, + gamma2, + sigma_c, + a1, + a2, + M2_temp, + b0, + b1, + b2, + delta1, + delta2, + ) + ngal_cent += halo_mass_func[i, j, k] * ncent_temp * ic + ngal_sat += halo_mass_func[i, j, k] * nsat_temp * ic + + return ngal_cent, ngal_sat + def compute_clustering(self, mock_dict, *args, **kwargs): """ Computes summary statistics, currently enabling ``wp`` and ``xirppi``. diff --git a/tests/.DS_Store b/tests/.DS_Store new file mode 100644 index 00000000..edd31f3e Binary files /dev/null and b/tests/.DS_Store differ diff --git a/tests/CSMF_test.ipynb b/tests/CSMF_test.ipynb new file mode 100644 index 00000000..a33d3d46 --- /dev/null +++ b/tests/CSMF_test.ipynb @@ -0,0 +1,537 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "9b5bdd09-5a9c-4561-b3e1-d57e69bd3a97", + "metadata": {}, + "source": [ + "\n", + "## Importing everything that is needed\n" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "33bc8be4-4f77-4124-a7f1-2f22c700c011", + "metadata": {}, + "outputs": [], + "source": [ + "import yaml\n", + "import numpy as np\n", + "from abacusnbody.hod.abacus_hod import AbacusHOD\n", + "from astropy.table import Table\n", + "from cosmoprimo.utils import DistanceToRedshift\n", + "from pyrecon import utils\n", + "from cosmoprimo.fiducial import AbacusSummit\n", + "import logging\n", + "import warnings\n", + "from astropy import units as u\n", + "\n", + "warnings.filterwarnings('ignore', category=np.VisibleDeprecationWarning)\n", + "logger = logging.getLogger('ds_abacus_lightcone')" + ] + }, + { + "cell_type": "markdown", + "id": "87a38aa8-1442-4eb4-9635-f016b73a4514", + "metadata": {}, + "source": [ + "## Define a function that return the ball sturcture for each halo catalogue. 
\n", + "## HOD parameters are varied in log10, which need to be converted" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "a74223e9-10b7-4184-b5d7-7f6480c0e5fb", + "metadata": {}, + "outputs": [], + "source": [ + "def get_hod(p, param_mapping, param_tracer, Ball, nthread, seed):\n", + " # read the parameters\n", + " # print(p)\n", + " for key in param_mapping.keys():\n", + " mapping_idx = param_mapping[key]\n", + " tracer_type = param_tracer[key]\n", + " if key == 'sigma' and tracer_type == 'LRG':\n", + " Ball.tracers[tracer_type][key] = 10 ** p[mapping_idx]\n", + " elif key == 'M_0' and tracer_type == 'CSMF':\n", + " Ball.tracers[tracer_type][key] = 10 ** p[mapping_idx]\n", + " elif key == 'M_1' and tracer_type == 'CSMF':\n", + " Ball.tracers[tracer_type][key] = 10 ** p[mapping_idx]\n", + " elif key == 'M_2' and tracer_type == 'CSMF':\n", + " Ball.tracers[tracer_type][key] = 10 ** p[mapping_idx]\n", + " else:\n", + " Ball.tracers[tracer_type][key] = p[mapping_idx]\n", + "\n", + " mock_dict = Ball.run_hod(\n", + " tracers=Ball.tracers,\n", + " want_rsd=Ball.want_rsd,\n", + " want_nfw=False,\n", + " NFW_draw=None,\n", + " Nthread=nthread,\n", + " reseed=seed,\n", + " verbose=True,\n", + " )\n", + " return mock_dict" + ] + }, + { + "cell_type": "markdown", + "id": "5fd41b5f-9415-4e9d-a35a-878c2eb67b5a", + "metadata": {}, + "source": [ + "## As the name it suggest it set ups the HOD code" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "29a4c90b-ae9f-4749-a965-e97b4413dc1a", + "metadata": {}, + "outputs": [], + "source": [ + "def setup_hod(config):\n", + " print(f\"Processing {config['sim_params']['sim_name']}\")\n", + " sim_params = config['sim_params']\n", + " HOD_params = config['HOD_params']\n", + " fit_params = config['fit_params']\n", + "\n", + " if HOD_params['CSMF_params']['Mstar_low'] < 100:\n", + " HOD_params['CSMF_params']['Mstar_low'] = (\n", + " 10 ** HOD_params['CSMF_params']['Mstar_low']\n", + " )\n", + " HOD_params['CSMF_params']['Mstar_up'] = (\n", + " 10 ** HOD_params['CSMF_params']['Mstar_up']\n", + " )\n", + "\n", + " Balls = []\n", + " for ez in zranges:\n", + " sim_params['z_mock'] = ez\n", + " Balls += [AbacusHOD(sim_params, HOD_params)]\n", + "\n", + " param_mapping = {}\n", + " param_tracer = {}\n", + " for key in fit_params.keys():\n", + " mapping_idx = fit_params[key][0]\n", + " tracer_type = fit_params[key][-1]\n", + " param_mapping[key] = mapping_idx\n", + " param_tracer[key] = tracer_type\n", + "\n", + " return Balls, param_mapping, param_tracer" + ] + }, + { + "cell_type": "markdown", + "id": "8bcd8f8a-0ab4-4614-93f9-743786ee2a2c", + "metadata": {}, + "source": [ + "## Dictionary to contral the code below " + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "0310aa3b-0815-4b73-b1d3-4b62737bf282", + "metadata": {}, + "outputs": [], + "source": [ + "args_dict = {\n", + " 'start_hod': 0,\n", + " 'n_hod': 1,\n", + " 'start_cosmo': 0,\n", + " 'n_cosmo': 1,\n", + " 'start_phase': 0,\n", + " 'n_phase': 1,\n", + " 'survey': 'DESI',\n", + " 'tracer': 'CSMF',\n", + " 'zmin': 0.1,\n", + " 'zmax': 0.4,\n", + " 'start_seed': 0,\n", + " 'n_seed': 1,\n", + " 'nthreads': 5,\n", + "}" + ] + }, + { + "cell_type": "markdown", + "id": "bc4f1cc0-410e-43ea-aee8-5a753d8fc278", + "metadata": {}, + "source": [ + "## Load in the config file and define the redshifts that combined in the light cone" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "8ac3f830-7bd6-4931-81ef-cbf9aa6266b9", + "metadata": {}, + 
"outputs": [], + "source": [ + "config = yaml.safe_load(open('data_CSMF/config_CSMF.yaml'))\n", + "zranges = [0.100]" + ] + }, + { + "cell_type": "markdown", + "id": "97e83b3f-e9f1-4672-8daa-87874d1c1b5c", + "metadata": { + "tags": [] + }, + "source": [ + "\n", + "## Downloading halo data using ``gdown``, which can be intalled with ``pip install gdown``\n" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "35fa5b96-2897-4e90-9214-1aaf71f874aa", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Downloading...\n", + "From (original): https://drive.google.com/uc?id=1VCBXlkYHChn1HCwRPnq9iDSgzILfXfwL\n", + "From (redirected): https://drive.google.com/uc?id=1VCBXlkYHChn1HCwRPnq9iDSgzILfXfwL&confirm=t&uuid=ce478b08-a653-4604-a55d-e2fb144f7ed9\n", + "To: /global/u2/p/pierre/abacusutils_modified/tests/data_CSMF/halos_data/AbacusSummit_base_c000_ph000/z0.100/particles_xcom_0_seed600_abacushod_oldfenv_MT_withranks_new.h5\n", + "100%|██████████| 260M/260M [00:01<00:00, 173MB/s] \n", + "Downloading...\n", + "From (original): https://drive.google.com/uc?id=1xXlbXr8h8AiRFc2p5knYSYloJ9jfcAY9\n", + "From (redirected): https://drive.google.com/uc?id=1xXlbXr8h8AiRFc2p5knYSYloJ9jfcAY9&confirm=t&uuid=00ce9d81-134e-41b2-996c-c27bb162fa2c\n", + "To: /global/u2/p/pierre/abacusutils_modified/tests/data_CSMF/halos_data/AbacusSummit_base_c000_ph000/z0.100/halos_xcom_0_seed600_abacushod_oldfenv_MT_new.h5\n", + "100%|██████████| 108M/108M [00:00<00:00, 138MB/s] \n" + ] + }, + { + "data": { + "text/plain": [ + "'data_CSMF/halos_data/AbacusSummit_base_c000_ph000/z0.100/halos_xcom_0_seed600_abacushod_oldfenv_MT_new.h5'" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "import gdown\n", + "\n", + "gdown.download(\n", + " id='1VCBXlkYHChn1HCwRPnq9iDSgzILfXfwL',\n", + " output='data_CSMF/halos_data/AbacusSummit_base_c000_ph000/z0.100/particles_xcom_0_seed600_abacushod_oldfenv_MT_withranks_new.h5',\n", + ")\n", + "gdown.download(\n", + " id='1xXlbXr8h8AiRFc2p5knYSYloJ9jfcAY9',\n", + " output='data_CSMF/halos_data/AbacusSummit_base_c000_ph000/z0.100/halos_xcom_0_seed600_abacushod_oldfenv_MT_new.h5',\n", + ")" + ] + }, + { + "cell_type": "markdown", + "id": "ac4e71ce-c351-4ab9-8918-98ef3c9c9f8c", + "metadata": {}, + "source": [ + "## Decide which cosmology, hod, seed and phase and prepare the HOD parameters" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "f10e377e-3688-4491-8f71-5e8f3aae2a11", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[10.96635881 11.49130401 27.75835925 0.18179997 0.29946413 2.14532573\n", + " 0.41764339 0.46919005 -1.42349829 -0.49794641 0.53148565]\n" + ] + } + ], + "source": [ + "cosmo = 0\n", + "phase = 0\n", + "seed = 0\n", + "hod = 0\n", + "\n", + "HOD_params = Table.read('data_CSMF/HOD_parameters.fits')\n", + "names = [\n", + " 'log_M_0',\n", + " 'log_M_1',\n", + " 'gamma_1',\n", + " 'gamma_2',\n", + " 'sigma_c',\n", + " 'a_1',\n", + " 'b_0',\n", + " 'b_1',\n", + " 's',\n", + " 'Bcent',\n", + " 'Bsat',\n", + "]\n", + "\n", + "HOD_params_np = []\n", + "for name in names:\n", + " HOD_params_np.append(np.array(HOD_params[name]))\n", + "HOD_params_np = np.array(HOD_params_np).T\n", + "print(HOD_params_np[hod])" + ] + }, + { + "cell_type": "markdown", + "id": "dfb02196-acda-48f7-82e2-0c3014ac0459", + "metadata": {}, + "source": [ + "## Run the HOD code and write data to 
astropy Table" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "3dd8dce1-a1f9-4d5c-81f2-c235a3fa9963", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Processing AbacusSummit_base_c000_ph000\n", + "generating centrals took 37.29109263420105\n", + "generating satellites took 44.424450635910034\n", + "CSMF number of galaxies 53496\n", + "satellite fraction 0.7775721549274712\n", + "organizing outputs took 5.719436407089233\n", + "generated CSMFs: 53496 satellite fraction 0.7775721549274712\n" + ] + } + ], + "source": [ + "mock_cosmo = AbacusSummit(cosmo)\n", + "Balls, param_mapping, param_tracer = setup_hod(config)\n", + "\n", + "data_positions_sky = []\n", + "for i, newBall in enumerate(Balls):\n", + " hod_dict = get_hod(\n", + " HOD_params_np[hod],\n", + " param_mapping,\n", + " param_tracer,\n", + " newBall,\n", + " args_dict['nthreads'],\n", + " seed,\n", + " )\n", + " data = hod_dict[args_dict['tracer']]\n", + "\n", + " dist, ra, dec = utils.cartesian_to_sky(\n", + " np.c_[data['x'] + 990, data['y'] + 990, data['z'] + 990]\n", + " )\n", + " d2z = DistanceToRedshift(mock_cosmo.comoving_radial_distance)\n", + " redshift = d2z(dist)\n", + "\n", + " mask = (\n", + " (redshift >= args_dict['zmin'])\n", + " & (redshift <= args_dict['zmax'])\n", + " & (data['stellarmass'] > 0)\n", + " )\n", + " central_id = np.zeros_like(data['stellarmass'])\n", + " central_id[: data['Ncent']] = 1\n", + "\n", + " data_positions_sky.append(\n", + " np.c_[\n", + " ra[mask],\n", + " dec[mask],\n", + " dist[mask],\n", + " redshift[mask],\n", + " data['stellarmass'][mask],\n", + " data['mass'][mask],\n", + " central_id[mask],\n", + " ]\n", + " )\n", + "data_positions_sky = np.concatenate(data_positions_sky, axis=0)\n", + "\n", + "HOD_table = Table()\n", + "HOD_table['ra'] = data_positions_sky[:, 0].astype(np.float32)\n", + "HOD_table['dec'] = data_positions_sky[:, 1].astype(np.float32)\n", + "HOD_table['comoving_distance_overh'] = (\n", + " data_positions_sky[:, 2].astype(np.float32) * u.Mpc\n", + ")\n", + "HOD_table['redshift'] = data_positions_sky[:, 3].astype(np.float32)\n", + "HOD_table['log10Mstar_overhsquare'] = (\n", + " np.log10(data_positions_sky[:, 4]).astype(np.float64) * u.Msun\n", + ")\n", + "HOD_table['log10Mhalo_overh'] = (\n", + " np.log10(data_positions_sky[:, 5]).astype(np.float64) * u.Msun\n", + ")\n", + "HOD_table['central flag'] = data_positions_sky[:, 6].astype(np.int32)\n", + "\n", + "HOD_table.write(\n", + " f'data_CSMF/galaxy_catalogue_cos{cosmo:03}_ph{phase:03}_hod{hod:03}_seed{seed:03}.fits',\n", + " overwrite=True,\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "464b26e4-8916-4844-a27d-0b87a4a58b64", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "data": { + "text/html": [ + "
[cell output: preview of the final HOD_table — first (central) and last (satellite) rows shown]

| ra | dec | comoving_distance_overh | redshift | log10Mstar_overhsquare | log10Mhalo_overh | central flag |
|---|---|---|---|---|---|---|
|  |  | Mpc |  | solMass | solMass |  |
| float32 | float32 | float32 | float32 | float64 | float64 | int32 |
| 89.80145 | 61.005356 | 313.05255 | 0.10718833 | 10.669699803548644 | 13.15851407014397 | 1 |
| ... | ... | ... | ... | ... | ... | ... |
| 2.3431413 | 0.0038444304 | 365.9732 | 0.12589984 | 10.503682171749702 | 13.252438001727299 | 0 |
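A minimal driver equivalent to the notebook cells above is sketched here; it assumes `config_CSMF.yaml` already holds the desired CSMF parameters (note that `setup_hod` converts `Mstar_low`/`Mstar_up`, and `get_hod` converts `M_0`/`M_1`/`M_2`, from log10 to linear units before populating).

    import yaml
    from abacusnbody.hod.abacus_hod import AbacusHOD

    # illustrative, following the notebook: one snapshot, parameters taken from the config
    config = yaml.safe_load(open('data_CSMF/config_CSMF.yaml'))
    newBall = AbacusHOD(config['sim_params'], config['HOD_params'])

    mock_dict = newBall.run_hod(
        tracers=newBall.tracers,      # includes the 'CSMF' parameter dictionary
        want_rsd=newBall.want_rsd,
        want_nfw=False,
        NFW_draw=None,
        Nthread=5,
        verbose=True,
    )

    gals = mock_dict['CSMF']          # Ncent, x, y, z, vx, vy, vz, mass, stellarmass, id
    fsat = 1 - gals['Ncent'] / len(gals['x'])
    print(len(gals['x']), 'CSMF galaxies, satellite fraction', fsat)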