Source code for lib.Qfit

import os, sys

import emcee
import numpy as np
from multiprocess import Pool
from schwimmbad import MPIPool

# Absolute path of the parent of the directory that contains this file.
__path__ = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))



[docs]
class FitEllSpace:
    """Fit a parametric model to binned auto- and cross-spectra with emcee.

    The spectra of ``Nmaps`` maps are stored as ``(Nmaps, Nmaps, Nbins)``
    arrays.  Only the upper triangle (``imap <= jmap``) is kept and flattened
    spectrum-major into a data vector of length ``Nspecs * Nbins`` where
    ``Nspecs = Nmaps * (Nmaps + 1) // 2``.  The covariance of that vector is
    estimated from the realisations in ``yerr``.

    Parameters
    ----------
    x : numpy.ndarray
        Bin centres, shape ``(Nbins,)``.
    y : numpy.ndarray
        Measured spectra, shape ``(Nmaps, Nmaps, Nbins)``.
    yerr : numpy.ndarray
        Realisations used to estimate the covariance, shape
        ``(Nreals, Nmaps, Nmaps, Nbins)``.
    model : callable
        Called as ``model(*parameters)`` with fixed and free parameters in the
        iteration order of ``parameters_file``; must return an array indexable
        as ``[imap, jmap]`` like ``y``.
    parameters_file : dict
        Mapping ``component -> parameter name -> settings``.  Only components
        listed in ``list_components`` are used.  Each settings dict provides
        ``"fit"`` (``True`` for a free parameter, otherwise the fixed value),
        ``"bound_min"`` / ``"bound_max"`` and, for free parameters,
        ``"init_average"`` / ``"init_std"``.
    sample_variance : bool, optional
        Add the analytic term of ``_fill_sample_variance`` to the covariance.
    fsky : float, optional
        Factor used in the sample variance term; required when
        ``sample_variance`` is true.
    dl : float, optional
        Factor used in the sample variance term.
    diagonal : bool, optional
        Zero the covariance between different bins before inversion.

    Raises
    ------
    TypeError
        If the inputs do not have the expected number of dimensions, or if
        ``sample_variance`` is requested without ``fsky``.
    """

    def __init__(self, x, y, yerr, model, parameters_file, sample_variance=True, fsky=None, dl=30, diagonal=False):
        self.x = x
        self.y = y
        self.yerr = yerr
        self.model = model

        self.params = parameters_file
        self.list_components = ["cmb", "dust", "synchrotron", "correlation"]

        ### Check if the user is giving the right dimensions
        self._check_shapein()

        ### Keep only the upper part of the matrix
        self._reshape_spectra()

        ### Reshape data to have two dimensions maximum
        self._init_reshape_data()

        ### Compute the noise covariance matrix
        self._get_noise_covariance_matrix(sample_variance=sample_variance, fsky=fsky, dl=dl, diagonal=diagonal)

    def _iter_parameters(self):
        """Yield ``(name, settings)`` for every parameter of a known component.

        Iteration follows the order of ``self.params``; this is the order in
        which free parameters are laid out in the sampled vector.
        """
        for component, component_params in self.params.items():
            if component not in self.list_components:
                continue
            yield from component_params.items()

    def get_fitting_parameters_names(self):
        """Return the names of the free parameters as a numpy array.

        The names are listed in the same order as the columns produced by
        ``_initial_conditions`` (and hence as the sampled chains).
        """
        fit_param_names = [
            name
            for name, info in self._iter_parameters()
            # Only add if "fit" key exists and is True
            if isinstance(info, dict) and info.get("fit") is True
        ]
        return np.array(fit_param_names)

    def _reshape_spectra_model(self, data):
        """Stack the upper-triangle spectra of ``data`` into ``(Nspecs, Nbins)``."""
        data_reshaped = np.zeros((self.nspecs, self.nbins))
        for k, (imap, jmap) in enumerate(zip(*np.triu_indices(self.nmaps))):
            data_reshaped[k, :] = data[imap, jmap]
        return data_reshaped

    def _reshape_spectra(self):
        """Keep the upper-triangle spectra of ``y`` and ``yerr``.

        Sets ``y_reshaped`` with shape ``(Nspecs, Nbins)`` and
        ``yerr_reshaped`` with shape ``(Nreals, Nspecs, Nbins)``.
        """
        self.y_reshaped = np.zeros((self.nspecs, self.nbins))
        self.yerr_reshaped = np.zeros((self.nreals, self.nspecs, self.nbins))

        for k, (imap, jmap) in enumerate(zip(*np.triu_indices(self.nmaps))):
            self.y_reshaped[k, :] = self.y[imap, jmap]
            self.yerr_reshaped[:, k, :] = self.yerr[:, imap, jmap, :]

    def _check_shapein(self):
        """Validate input dimensionality and record the problem sizes.

        Sets ``nreals``, ``nmaps``, ``nbins`` (from ``yerr.shape``) and
        ``nspecs``.
        """
        if self.x.ndim != 1:
            raise TypeError("x should have 1 dimensions (Nbins)")

        if self.y.ndim != 3:
            raise TypeError("y should have 3 dimensions (Nmaps, Nmaps, Nbins)")

        if self.yerr.ndim != 4:
            raise TypeError("yerr should have 4 dimensions (Nreals, Nmaps, Nmaps, Nbins)")

        ### Get the shape (Nreals, Nmaps, Nmaps, Nbins)
        self.nreals, self.nmaps, _, self.nbins = self.yerr.shape
        self.nspecs = self.nmaps * (self.nmaps + 1) // 2

    def _init_reshape_data(self):
        """Flatten the (spectrum, bin) axes: index = ispec * Nbins + ibin."""
        self.y_reshaped = self.y_reshaped.reshape((self.nspecs * self.nbins))
        self.yerr_reshaped = self.yerr_reshaped.reshape((self.nreals, self.nspecs * self.nbins))

    def _get_noise_covariance_matrix(self, sample_variance, fsky, dl, diagonal=False):
        """Estimate the covariance of the data vector and its pseudo-inverse.

        Sets ``noise_covariance_matrix``, ``noise_correlation_matrix`` (always
        the full correlation of the realisations) and ``invN``.
        """
        ndata = self.nspecs * self.nbins

        # np.cov returns a 0-d array for a single variable; keep it 2-D.
        covariance = np.atleast_2d(np.cov(self.yerr_reshaped, rowvar=False))
        self.noise_correlation_matrix = np.corrcoef(self.yerr_reshaped, rowvar=False)

        if diagonal:
            # The data vector is spectrum-major (see _init_reshape_data), so
            # the 4-D view must be (spec, bin, spec, bin).  Multiplying by the
            # identity on the two bin axes removes bin-to-bin terms while
            # keeping the correlations between spectra within a bin.
            same_bin = np.eye(self.nbins)[None, :, None, :]
            covariance = covariance.reshape((self.nspecs, self.nbins, self.nspecs, self.nbins)) * same_bin
            covariance = covariance.reshape((ndata, ndata))

        if sample_variance:
            covariance = covariance + self._fill_sample_variance(self.y, fsky, dl)

        self.noise_covariance_matrix = covariance
        self.invN = np.linalg.pinv(self.noise_covariance_matrix)

    def _fill_sample_variance(self, bandpower, fsky, dl):
        """Build the analytic sample variance matrix.

        For spectra ``(i1, i2)`` and ``(j1, j2)`` the entry at a given bin is
        ``(C[i1, j1] * C[i2, j2] + C[i1, j2] * C[i2, j1])
        / ((2 * x + 1) * fsky * dl)``; entries between different bins are 0.

        Returns
        -------
        numpy.ndarray
            Matrix of shape ``(Nspecs * Nbins, Nspecs * Nbins)`` with the same
            spectrum-major layout as the data vector.

        Raises
        ------
        TypeError
            If ``fsky`` is None.
        """
        if fsky is None:
            raise TypeError("fsky must be provided when sample_variance is True")

        nbins = len(self.x)
        first, second = np.triu_indices(self.nmaps)
        factor_modecount = 1 / ((2 * self.x + 1) * fsky * dl)

        # covar[ii, jj, :] for every pair of spectra at once.
        covar = (
            bandpower[first[:, None], first[None, :]] * bandpower[second[:, None], second[None, :]]
            + bandpower[first[:, None], second[None, :]] * bandpower[second[:, None], first[None, :]]
        ) * factor_modecount

        # Place each covar[ii, jj, :] on the bin diagonal of block (ii, jj).
        matrix = covar[:, None, :, :] * np.eye(nbins)[None, :, None, :]
        return matrix.reshape((self.nspecs * nbins, self.nspecs * nbins))

    def _initial_conditions(self, nwalkers):
        """Draw Gaussian starting points for the free parameters.

        Sets ``ndim`` and returns an array of shape ``(nwalkers, ndim)``.
        """
        rows = [np.zeros((0, nwalkers))]

        for _, info in self._iter_parameters():
            ### Check if the user define the parameter as free and not fixed at given value
            if info["fit"] is True:
                rows.append(np.random.normal(info["init_average"], info["init_std"], (1, nwalkers)))

        x0 = np.concatenate(rows, axis=0)
        self.ndim = x0.shape[0]

        return x0.T

    def log_prior(self, x):
        """Flat prior on the full parameter vector.

        ``x`` holds one value per parameter (fixed and free) in the order
        produced by ``_fill_params``.  Returns 0 when every value lies within
        ``[bound_min, bound_max]`` and ``-np.inf`` otherwise.
        """
        for value, (_, info) in zip(x, self._iter_parameters()):
            if value > info["bound_max"] or value < info["bound_min"]:
                return -np.inf

        return 0

    def _fill_params(self, x):
        """Merge the free values ``x`` with the fixed values from ``params``."""
        values = []
        count = 0
        for _, info in self._iter_parameters():
            ### Add values of the fixed parameters only if there is no True in the params.yaml file
            if info["fit"] is True:
                values.append(x[count])
                count += 1
            else:
                values.append(info["fit"])

        return np.array(values, dtype=float)

    def loglikelihood(self, x):
        """Log-probability (flat prior plus Gaussian likelihood) of ``x``.

        ``x`` contains the free parameters only.  The model is not evaluated
        when the prior is not finite.
        """
        ### Fill in array with fixed and free parameters
        theta = self._fill_params(x)

        lp = self.log_prior(theta)
        if not np.isfinite(lp):
            # Outside the prior: skip the model call, which may be costly or
            # return NaN for such values.
            return -np.inf

        prediction = self._reshape_spectra_model(self.model(*theta)).reshape(self.y_reshaped.shape)
        residuals = self.y_reshaped - prediction

        return lp - 0.5 * (residuals @ self.invN @ residuals)

    def run(self, nsteps, nwalkers, discard=0, comm=None, thin=15):
        """Sample the posterior with ``emcee.EnsembleSampler``.

        Parameters
        ----------
        nsteps : int
            Number of steps passed to ``run_mcmc``.
        nwalkers : int
            Number of walkers.
        discard : int, optional
            Number of initial steps dropped from the flattened chain.
        comm : object, optional
            Communicator exposing ``Get_size`` and ``Get_rank``.  When it
            reports more than one process the sampler runs without a local
            process pool.
        thin : int, optional
            Thinning applied to the flattened chain.

        Returns
        -------
        samples : numpy.ndarray
            The full chain from ``get_chain()`` (no discard, no thinning).
        samples_flat : numpy.ndarray
            The flattened chain after ``discard`` and ``thin``.
        """
        x0 = self._initial_conditions(nwalkers)

        # MPI mode
        if comm is not None and comm.Get_size() > 1:
            if comm.Get_rank() == 0:
                print("Running with MPI")

            # NOTE(review): no pool is handed to the sampler in this branch,
            # so every process calling run() executes the whole chain itself.
            sampler = emcee.EnsembleSampler(nwalkers, self.ndim, log_prob_fn=self.loglikelihood)
            sampler.run_mcmc(x0, nsteps, progress=True)

        # Local multiprocessing
        else:
            print("Running on multi-threading")

            nproc = int(os.environ.get("SLURM_CPUS_PER_TASK", 4))

            with Pool(processes=nproc) as pool:
                sampler = emcee.EnsembleSampler(nwalkers, self.ndim, log_prob_fn=self.loglikelihood, pool=pool)
                sampler.run_mcmc(x0, nsteps, progress=True)

        samples_flat = sampler.get_chain(flat=True, discard=discard, thin=thin)
        samples = sampler.get_chain()

        return samples, samples_flat