Source code for tf_pwa.config_loader.multi_config

import contextlib
import copy
import functools
import itertools
import json
import os
import re
import time
import warnings

import matplotlib.pyplot as plt
import numpy as np
import sympy as sy
import yaml
from scipy.interpolate import interp1d
from scipy.optimize import BFGS, basinhopping, minimize

from tf_pwa.amp import (
    AmplitudeModel,
    DecayChain,
    DecayGroup,
    get_decay,
    get_particle,
)
from tf_pwa.applications import (
    cal_hesse_error,
    corr_coef_matrix,
    fit,
    fit_fractions,
)
from tf_pwa.cal_angle import prepare_data_from_decay
from tf_pwa.data import (
    data_index,
    data_merge,
    data_shape,
    data_split,
    data_to_numpy,
    load_data,
    save_data,
)
from tf_pwa.fit import FitResult
from tf_pwa.fit_improve import minimize as my_minimize
from tf_pwa.model import FCN, CombineFCN, Model, Model_new
from tf_pwa.model.cfit import Model_cfit
from tf_pwa.particle import split_particle_type
from tf_pwa.root_io import has_uproot, save_dict_to_root
from tf_pwa.utils import time_print
from tf_pwa.variable import Variable, VarsManager

from .config_loader import ConfigLoader
from .decay_config import DecayConfig



[docs]
class MultiConfig(object):
    def __init__(
        self,
        file_names,
        vm=None,
        total_same=False,
        share_dict={},
        multi_gpu=False,
    ):
        if vm is None:
            self.vm = VarsManager(multi_gpu=multi_gpu)
            # print(self.vm)
        else:
            self.vm = vm
        self.total_same = total_same
        self.configs = []
        for i in file_names:
            if isinstance(i, (str, dict)):
                c = ConfigLoader(i, vm=self.vm, share_dict=share_dict)
            elif isinstance(i, list):
                from tf_pwa.config_loader import MixConfig

                c = MixConfig(i, vm=self.vm, share_dict=share_dict)
            else:
                raise ValueError("config for {} is not supported".format(i))
            self.configs.append(c)
        self.bound_dic = {}
        self.gauss_constr_dic = {}
        self._neglect_when_set_params = []
        self.cached_fcn = {}
        self.inv_he = None


[docs]
    def get_all_data(self):
        return [i.get_all_data() for i in self.configs]



[docs]
    def get_amplitudes(self, vm=None):
        if not self.total_same:
            amps = [
                j.get_amplitude(name="s" + str(i), vm=vm)
                for i, j in enumerate(self.configs)
            ]
        else:
            amps = [j.get_amplitude(vm=vm) for j in self.configs]
        for i in self.configs:
            self.bound_dic.update(i.bound_dic)
            self.gauss_constr_dic.update(i.gauss_constr_dic)
            for j in i._neglect_when_set_params:
                if j not in self._neglect_when_set_params:
                    self._neglect_when_set_params.append(j)
        return amps


    """
    def _get_models(self, vm=None): # get_model is useless to users given get_fcn and get_amplitude
        if not self.total_same:
            models = [j._get_model(name="s"+str(i), vm=vm)
                      for i, j in enumerate(self.configs)]
        else:
            models = [j._get_model(vm=vm) for j in self.configs]
        return models
    """


[docs]
    def get_fcns(self, datas=None, vm=None, batch=65000):
        if datas is not None:
            if not self.total_same:
                fcns = [
                    i[1].get_fcn(
                        name="s" + str(i[0]),
                        all_data=j,
                        vm=vm,
                        batch=batch,
                    )
                    for i, j in zip(enumerate(self.configs), datas)
                ]
            else:
                fcns = [
                    j.get_fcn(
                        all_data=data,
                        vm=vm,
                        batch=batch,
                    )
                    for data, j in zip(datas, self.configs)
                ]
        else:
            if not self.total_same:
                fcns = [
                    j.get_fcn(
                        name="s" + str(i),
                        vm=vm,
                        batch=batch,
                    )
                    for i, j in enumerate(self.configs)
                ]
            else:
                fcns = [j.get_fcn(vm=vm, batch=batch) for j in self.configs]
        return fcns



[docs]
    def get_fcn(self, datas=None, vm=None, batch=65000):
        if datas is None:
            if vm in self.cached_fcn:
                return self.cached_fcn[vm]
        fcns = self.get_fcns(datas=datas, vm=vm, batch=batch)
        fcn = CombineFCN(fcns=fcns, gauss_constr=self.gauss_constr_dic)
        if datas is None:
            self.cached_fcn[vm] = fcn
        return fcn



[docs]
    def get_args_value(self, bounds_dict):
        args = {}
        args_name = self.vm.trainable_vars
        x0 = []
        bnds = []

        for i in self.vm.trainable_variables:
            args[i.name] = i.numpy()
            x0.append(i.numpy())
            if i.name in bounds_dict:
                bnds.append(bounds_dict[i.name])
            else:
                bnds.append((None, None))
            args["error_" + i.name] = 0.1

        return args_name, x0, args, bnds



[docs]
    @time_print
    def fit(
        self,
        datas=None,
        batch=65000,
        method="BFGS",
        maxiter=None,
        print_init_nll=False,
        callback=None,
        add_fun=None,
        constraints=None,
    ):
        fcn = self.get_fcn(datas=datas)
        if add_fun is not None:
            from tf_pwa.model.model import AddFCN

            add_fun_obj = fcn.vm.build_nll_grad(add_fun)
            fcn = AddFCN(fcn, add_fun_obj)
        # fcn.gauss_constr.update({"Zc_Xm_width": (0.177, 0.03180001857)})
        print("\n########### initial parameters")
        print(json.dumps(fcn.get_params(), indent=2), flush=True)
        if print_init_nll:
            print("initial NLL: ", fcn({}))
        self.fit_params = fit(
            fcn=fcn,
            method=method,
            bounds_dict=self.bound_dic,
            maxiter=maxiter,
            callback=callback,
            constraints=constraints,
        )
        if self.fit_params.hess_inv is not None:
            self.inv_he = self.fit_params.hess_inv
        return self.fit_params



[docs]
    def fit_cons(self, fun, val, k=10000, gauss_first=True, **kwargs):
        return ConfigLoader.fit_cons(
            self, fun, val, k=10000, gauss_first=True, **kwargs
        )



[docs]
    def reinit_params(self):
        self.get_amplitudes()[0].vm.refresh_vars(bound_dic=self.bound_dic)



[docs]
    def get_params_error(
        self, params=None, datas=None, batch=10000, using_cached=False
    ):
        if params is None:
            params = {}
        if hasattr(params, "params"):
            params = getattr(params, "params")

        if using_cached and self.inv_he is not None:
            hesse_error = np.sqrt(np.fabs(self.inv_he.diagonal())).tolist()
        else:
            fcn = self.get_fcn(datas, batch=batch)
            hesse_error, self.inv_he = cal_hesse_error(
                fcn, params, check_posi_def=True, save_npy=True
            )
        # hesse_error, self.inv_he = cal_hesse_error(
        # fcn, params, check_posi_def=True, save_npy=True
        # )
        print("hesse_error:", hesse_error)
        err = dict(zip(self.vm.trainable_vars, hesse_error))
        if hasattr(self, "fit_params"):
            self.fit_params.set_error(err)
        return err



[docs]
    def get_params(self, trainable_only=False):
        # _amps = self.get_fcn()
        return self.vm.get_all_dic(trainable_only)



[docs]
    def set_params(self, params, neglect_params=None):
        _amps = self.get_amplitudes()
        self.configs[0].set_params(params, neglect_params=neglect_params)



[docs]
    @contextlib.contextmanager
    def params_trans(self):
        with self.vm.error_trans(self.inv_he) as f:
            yield f



[docs]
    def save_params(self, file_name):
        params = self.get_params()
        val = {k: float(v) for k, v in params.items()}
        with open(file_name, "w") as f:
            json.dump(val, f, indent=2)


    def _get_plot_partial_wave_input(
        self, params=None, prefix="figure/all", save_root=False, **kwargs
    ):
        path = os.path.dirname(prefix)
        os.makedirs(path, exist_ok=True)

        all_data = []
        extra = None
        for config_i in self.configs:
            for data, extra in config_i._get_plot_partial_wave_input(
                params=params, **kwargs
            ):
                all_data.append(data)

        data_dict = data_to_numpy(data_merge(*[i[0] for i in all_data]))
        bg_dict = data_to_numpy(data_merge(*[i[2] for i in all_data]))

        all_keys = list(all_data[-1][1].keys())
        for idx, i in enumerate(all_data[:-1]):
            phsp = i[1]
            weights_keys = [j for j in phsp.keys() if j.endswith("_fit")]
            tail_keys = [k[k[4:].index("_") + 4 :] for k in weights_keys]
            for k in all_keys:
                if k in phsp or not k.endswith("_fit"):
                    continue
                weights_keys = [j for j in phsp.keys() if j.endswith("_fit")]
                idx_key = k[k[4:].index("_") + 4 :]
                if idx_key in tail_keys:
                    new_name = weights_keys[tail_keys.index(idx_key)]
                    print(
                        "com_plot: use", new_name, "for", k, "for sample", idx
                    )
                    phsp[k] = phsp[new_name]
                else:
                    print("com_plot: set", k, "to 0 for sample", idx)
                    phsp[k] = np.zeros_like(phsp["MC_total_fit"])
        phsp_dict = data_to_numpy(data_merge(*[i[1] for i in all_data]))

        if save_root:
            save_dict_to_root(
                [data_dict, phsp_dict, bg_dict],
                file_name=prefix + "variables_com.root",
                tree_name=["data", "fitted", "sideband"],
            )
            print("Save root file " + prefix + "com_variables.root")

        return (data_dict, phsp_dict, bg_dict), extra


[docs]
    def plot_partial_wave(
        self, params=None, prefix="figure/all", save_root=False, **kwargs
    ):

        data, extra = self._get_plot_partial_wave_input(
            params=params, prefix=prefix, save_root=save_root, **kwargs
        )

        data_dict, phsp_dict, bg_dict = data
        _, plot_var_dic, chain_property, nll = extra

        self.configs[-1]._plot_partial_wave(
            data_dict,
            phsp_dict,
            bg_dict,
            prefix,
            plot_var_dic,
            chain_property,
            nll=nll,
            **kwargs,
        )