Source code for beetroots.approx_optim.nn_bo

from typing import Dict, List, Union

import numpy as np
from scipy.stats import gaussian_kde
from tqdm.auto import tqdm

from beetroots.approx_optim.abstract_approx_optim import ApproxParamsOptim
from beetroots.approx_optim.approach_type.bo import BayesianOptimizationApproach
from beetroots.approx_optim.forward_map.nn import ApproxOptimNN



[docs]
class ApproxParamsOptimNNBO(
    ApproxParamsOptim, ApproxOptimNN, BayesianOptimizationApproach
):
    r"""class that performs likelihood parameter optimization using Bayesian optimization for a neural network forward map"""


[docs]
    def main(
        self,
        dict_forward_model: Dict[str, Union[str, bool, List[bool], List[float]]],
        lower_bounds_lin: Union[np.ndarray, List],
        upper_bounds_lin: Union[np.ndarray, List],
        n_iter: int,
    ):
        r"""main method of the class, sets up the optimization problems and solves them

        Parameters
        ----------
        dict_forward_model : Dict[str, Union[str, bool, List[bool], List[float], Dict[str, float]]]
            contains the necessary information to load the forward model with the :class:`NeuralNetworkApprox`
        lower_bounds_lin : Union[np.ndarray, List]
            lower bounds on the physical parameters (in linear scale)
        upper_bounds_lin : Union[np.ndarray, List]
            upper bounds on the physical parameters (in linear scale)
        n_iter : int
            number of iterations for the Bayesian optimization
        """

        assert isinstance(dict_forward_model["forward_model_name"], str)
        # assert isinstance(angle, float)

        if isinstance(lower_bounds_lin, list):
            lower_bounds_lin = np.array(lower_bounds_lin)
        if isinstance(upper_bounds_lin, list):
            upper_bounds_lin = np.array(upper_bounds_lin)

        assert isinstance(lower_bounds_lin, np.ndarray)
        assert isinstance(upper_bounds_lin, np.ndarray)
        assert isinstance(n_iter, int) and n_iter > 0

        if isinstance(lower_bounds_lin, list):
            lower_bounds_lin = np.array(lower_bounds_lin)
        if isinstance(lower_bounds_lin, list):
            lower_bounds_lin = np.array(lower_bounds_lin)

        assert isinstance(dict_forward_model["fixed_params"], dict)
        self.list_idx_sampling = [
            i
            for i, v in enumerate(dict_forward_model["fixed_params"].values())
            if v is None
        ]
        r"""List[int]: indices of physical parameters considered as variables for the likelihood parameter adjustment"""

        self.D_sampling = len(self.list_idx_sampling)
        r"""int: number of physical parameters considered as variables for the likelihood parameter adjustment"""

        self.N_samples_theta = self.K**self.D_sampling
        r"""int: number of samples for :math:`\theta` used to build the histogram of :math:`\log_{10} f_\ell(\theta)`"""

        print("starting setup")
        # step 1: set the bounds for the parameters to be adjusted
        (
            log10_f0,
            bounds_a0_low,
            bounds_a0_high,
            bounds_a1_low,
            bounds_a1_high,
        ) = self.setup_params_bounds()

        # step 2: compute the histogram of log f(theta)
        log10_f_Theta = self.compute_log10_f_Theta(
            dict_forward_model,
            lower_bounds_lin,
            upper_bounds_lin,
        )
        log10_f_Theta_low = log10_f_Theta.min(axis=0)  # (L,)
        log10_f_Theta_high = log10_f_Theta.max(axis=0)  # (L,)

        # step 3: set the KDE on log10 f_\ell(theta)
        print(r"starting evaluation of kde of log10 f_\ell(theta)")
        list_log10_f_grid = np.zeros((self.log10_f_grid_size, self.L))
        pdf_kde_log10_f_Theta = np.zeros((self.log10_f_grid_size, self.L))
        for ell in range(self.L):
            list_log10_f_grid[:, ell] = np.linspace(
                log10_f_Theta_low[ell],
                log10_f_Theta_high[ell],
                self.log10_f_grid_size,
            )
            kde_log10_f_Theta = gaussian_kde(log10_f_Theta[:, ell])
            pdf_kde_log10_f_Theta[:, ell] = kde_log10_f_Theta.pdf(
                list_log10_f_grid[:, ell],
            )
        print(r"evaluation of kde of log10 f_\ell(theta) done")

        print(
            f"Starting the optimization. Number of optimization to run per line = {self.N_optim_per_line}"
        )
        for ell in tqdm(range(self.L)):
            print(f"starting line {ell} ({self.list_lines[ell]})")
            self.plot_hist_log10_f_Theta(
                log10_f_Theta[:, ell],
                log10_f_Theta_low[ell],
                log10_f_Theta_high[ell],
                list_log10_f_grid[:, ell],
                pdf_kde_log10_f_Theta[:, ell],
                ell,
            )

            for n in tqdm(range(self.N_optim_per_line)):
                pbounds = {
                    "a0": (bounds_a0_low[n, ell], bounds_a0_high[n, ell]),
                    "a1": (bounds_a1_low, bounds_a1_high),
                }
                self.save_setup_to_json(n, ell, pbounds)
                self.optimization(
                    first_points=[(log10_f0[n, ell], 0.5)],
                    init_points=3,
                    n_iter=n_iter,  # 50
                    list_log10_f_grid=list_log10_f_grid[:, ell],
                    pdf_kde_log10_f_Theta=pdf_kde_log10_f_Theta[:, ell],
                    pbounds=pbounds,
                    sigma_a_val=self.sigma_a[n, ell],
                    sigma_m_val=self.sigma_m[n, ell],
                    n=n,
                    ell=ell,
                )

        df_best = self.extract_optimal_params()
        df_best = df_best.set_index(["n", "ell"])

        self.plot_params_with_sigma_a(df_best)

        for n in range(self.N_optim_per_line):
            for ell in range(self.L):
                best_point = df_best.loc[(n, ell), ["a0_best", "a1_best"]].values
                self.plot_hist_log10_f_Theta_with_optim_results(
                    log10_f_Theta=log10_f_Theta[:, ell],
                    log10_f_Theta_low=log10_f_Theta_low[ell],
                    log10_f_Theta_high=log10_f_Theta_high[ell],
                    list_log10_f_grid=list_log10_f_grid[:, ell],
                    pdf_kde_log10_f_Theta=pdf_kde_log10_f_Theta[:, ell],
                    n=n,
                    ell=ell,
                    best_point=best_point,
                )

        self.plots_postprocessing(
            bounds_a0_low,
            bounds_a0_high,
            bounds_a1_low,
            bounds_a1_high,
            n_iter,
        )
        return