diff --git a/src/scripts/ParitySigma.py b/src/scripts/ParitySigma.py new file mode 100644 index 0000000..2740112 --- /dev/null +++ b/src/scripts/ParitySigma.py @@ -0,0 +1,294 @@ +import os +import yaml +import argparse +import numpy as np +import torch +import matplotlib.pyplot as plt +from utils.config import Config +from utils.defaults import DefaultsAnalysis +from data.data import DataPreparation +from analyze.analyze import AggregateCheckpoints + +# from plots import Plots + + +def parse_args(): + parser = argparse.ArgumentParser(description="data handling module") + # there are three options with the parser: + # 1) Read from a yaml + # 2) Reads from the command line and default file + # and dumps to yaml + + # option to pass name of config + parser.add_argument("--config", "-c", default=None) + + # model + # we need some info about the model to run this analysis + # path to save the model results + parser.add_argument("--dir", + default=DefaultsAnalysis["common"]["dir"]) + # now args for model + parser.add_argument( + "--n_models", + type=int, + default=DefaultsAnalysis["model"]["n_models"], + help="Number of MVEs in the ensemble", + ) + parser.add_argument( + "--BETA", + type=beta_type, + required=False, + default=DefaultsAnalysis["model"]["BETA"], + help="If loss_type is bnn_loss, specify a beta as a float or \ + there are string options: linear_decrease, \ + step_decrease_to_0.5, and step_decrease_to_1.0", + ) + parser.add_argument( + "--COEFF", + type=float, + required=False, + default=DefaultsAnalysis["model"]["COEFF"], + help="COEFF for DER", + ) + parser.add_argument( + "--loss_type", + type=str, + required=False, + default=DefaultsAnalysis["model"]["loss_type"], + help="loss_type for DER, either SDER or DER", + ) + parser.add_argument( + "--noise_level_list", + type=list, + required=False, + default=DefaultsAnalysis["analysis"]["noise_level_list"], + help="Noise levels to compare", + ) + parser.add_argument( + "--model_names_list", + type=list, + required=False, + default=DefaultsAnalysis["analysis"]["model_names_list"], + help="Beginning of name for saved checkpoints and figures", + ) + parser.add_argument( + "--n_epochs", + type=int, + required=False, + default=DefaultsAnalysis["model"]["n_epochs"], + help="number of epochs", + ) + parser.add_argument( + "--plot", + action="store_true", + default=DefaultsAnalysis["analysis"]["plot"], + help="option to plot in notebook", + ) + parser.add_argument( + "--color_list", + type=list, + default=DefaultsAnalysis["plots"]["color_list"], + help="list of named or hexcode colors to use for the noise levels", + ) + parser.add_argument( + "--savefig", + action="store_true", + default=DefaultsAnalysis["analysis"]["savefig"], + help="option to save a figure of the true and predicted values", + ) + parser.add_argument( + "--verbose", + action="store_true", + default=DefaultsAnalysis["analysis"]["verbose"], + help="verbose option for train", + ) + args = parser.parse_args() + args = parser.parse_args() + if args.config is not None: + print("Reading settings from config file", args.config) + config = Config(args.config) + + else: + temp_config = DefaultsAnalysis["common"]["temp_config"] + print( + "Reading settings from cli and default, \ + dumping to temp config: ", + temp_config, + ) + os.makedirs(os.path.dirname(temp_config), exist_ok=True) + + # check if args were specified in cli + input_yaml = { + "common": {"dir": args.dir}, + "model": {"n_models": args.n_models, + "n_epochs": args.n_epochs, + "BETA": args.BETA, + "COEFF": args.COEFF, + "loss_type": args.loss_type}, + "analysis": { + "noise_level_list": args.noise_level_list, + "model_names_list": args.model_names_list, + "plot": args.plot, + "savefig": args.savefig, + "verbose": args.verbose, + }, + "plots": {"color_list": args.color_list}, + # "metrics": {key: {} for key in args.metrics}, + } + + yaml.dump(input_yaml, open(temp_config, "w")) + config = Config(temp_config) + + return config + # return parser.parse_args() + + +def beta_type(value): + if isinstance(value, float): + return value + elif value.lower() == "linear_decrease": + return value + elif value.lower() == "step_decrease_to_0.5": + return value + elif value.lower() == "step_decrease_to_1.0": + return value + else: + raise argparse.ArgumentTypeError( + "BETA must be a float or one of 'linear_decrease', \ + 'step_decrease_to_0.5', 'step_decrease_to_1.0'" + ) + + +if __name__ == "__main__": + config = parse_args() + DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu") + noise_list = config.get_item("analysis", "noise_level_list", "Analysis") + color_list = config.get_item("plots", "color_list", "Analysis") + BETA = config.get_item("model", "BETA", "Analysis") + COEFF = config.get_item("model", "COEFF", "Analysis") + loss_type = config.get_item("model", "loss_type", "Analysis") + sigma_list = [] + for noise in noise_list: + sigma_list.append(DataPreparation.get_sigma(noise)) + root_dir = config.get_item("common", "dir", "Analysis") + path_to_chk = root_dir + "checkpoints/" + path_to_out = root_dir + "analysis/" + # check that this exists and if not make it + if not os.path.isdir(path_to_out): + print('does not exist, making dir', path_to_out) + os.mkdir(path_to_out) + else: + print('already exists', path_to_out) + model_name_list = config.get_item("analysis", + "model_names_list", + "Analysis") + print("model list", model_name_list) + print("noise list", noise_list) + chk_module = AggregateCheckpoints() + # make an empty nested dictionary with keys for + # model names followed by noise levels + al_dict = { + model_name: {noise: [] for noise in noise_list} + for model_name in model_name_list + } + al_std_dict = { + model_name: {noise: [] for noise in noise_list} + for model_name in model_name_list + } + n_epochs = config.get_item("model", "n_epochs", "Analysis") + for model in model_name_list: + for noise in noise_list: + # append a noise key + # now run the analysis on the resulting checkpoints + if model[0:3] == "DER": + for epoch in range(n_epochs): + chk = chk_module.load_checkpoint( + model, + noise, + epoch, + DEVICE, + path=path_to_chk, + COEFF=COEFF, + loss=loss_type + ) + # path=path_to_chk) + # things to grab: 'valid_mse' and 'valid_bnll' + epistemic_m, aleatoric_m, e_std, a_std = ( + chk_module.ep_al_checkpoint_DER(chk) + ) + al_dict[model][noise].append(aleatoric_m) + al_std_dict[model][noise].append(a_std) + + else: + n_models = config.get_item("model", "n_models", "DE") + for epoch in range(n_epochs): + list_mus = [] + list_vars = [] + for nmodels in range(n_models): + chk = chk_module.load_checkpoint( + model, + noise, + epoch, + DEVICE, + path=path_to_chk, + BETA=BETA, + nmodel=nmodels, + ) + mu_vals, var_vals = chk_module.ep_al_checkpoint_DE(chk) + list_mus.append(mu_vals) + list_vars.append(var_vals) + al_dict[model][noise].append(np.median(np.mean(list_vars, + axis=0))) + al_std_dict[model][noise].append(np.std(np.mean(list_vars, + axis=0))) + # make a two-paneled plot for the different noise levels + # make one panel per model + # for the noise levels: + plt.clf() + fig = plt.figure(figsize=(10, 4)) + #ax = fig.add_subplot(111) + # try this instead with a fill_between method + sym_list = ['^', '*'] + for m, model in enumerate(model_name_list): + ax = fig.add_subplot(1, len(model_name_list), m + 1) + # Your plotting code for each model here + for i, noise in enumerate(noise_list): + if model[0:3] == "DE_": + # only take the sqrt for the case of DE, + # which is the variance + al = np.array(np.sqrt(al_dict[model][noise])) + al_std = np.array(np.sqrt(al_std_dict[model][noise])) + else: + al = np.array(al_dict[model][noise]) + al_std = np.array(al_std_dict[model][noise]) + # summarize the aleatoric + ax.errorbar(sigma_list[i], + al[-1], + yerr=al_std[-1], + color=color_list[i], + capsize=5) + ax.scatter(sigma_list[i], + al[-1], + color=color_list[i], + label=r"$\sigma = $" + str(sigma_list[i])) + ax.set_ylabel("Aleatoric Uncertainty") + ax.set_xlabel("True (Injected) Uncertainty") + ax.plot(range(0, 14), range(0, 14), ls='--', color='black') + ax.set_ylim([0,14]) + ax.set_xlim([0,14]) + if model[0:3] == "DER": + ax.set_title("Deep Evidential Regression") + elif model[0:2] == "DE": + ax.set_title("Deep Ensemble (100 models)") + plt.legend() + if config.get_item("analysis", "savefig", "Analysis"): + plt.savefig( + str(path_to_out) + + "parity_plot_uncertainty_" + + str(n_epochs) + + "_n_models_DE_" + + str(n_models) + + ".png" + ) + if config.get_item("analysis", "plot", "Analysis"): + plt.show()