# Source code for recipes.cpc1.e029_sheffield.evaluate

import json
import logging
from pathlib import Path

import hydra
import numpy as np
from omegaconf import DictConfig
from scipy.optimize import curve_fit
from scipy.stats import kendalltau, pearsonr

logger = logging.getLogger(__name__)

def rmse_score(x, y):
    """Return the root-mean-square error between ``x`` and ``y``.

    Args:
        x: Array-like of values (e.g. predictions).
        y: Array-like of values (e.g. labels), broadcast-compatible with ``x``.

    Returns:
        The square root of the mean squared element-wise difference.
    """
    # np.asarray lets plain Python sequences be passed as well as arrays.
    diff = np.asarray(x) - np.asarray(y)
    return np.sqrt(np.mean(diff**2))
def ncc_score(x, y):
    """Return the Pearson correlation coefficient between ``x`` and ``y``.

    Args:
        x: Sequence of values (e.g. predictions).
        y: Sequence of values (e.g. labels) of the same length as ``x``.

    Returns:
        The first element of ``scipy.stats.pearsonr(x, y)``, i.e. the
        correlation coefficient (the p-value is discarded).
    """
    return pearsonr(x, y)[0]
def kt_score(x, y):
    """Return Kendall's tau rank correlation between ``x`` and ``y``.

    Args:
        x: Sequence of values (e.g. predictions).
        y: Sequence of values (e.g. labels) of the same length as ``x``.

    Returns:
        The first element of ``scipy.stats.kendalltau(x, y)``, i.e. the tau
        statistic (the p-value is discarded).
    """
    return kendalltau(x, y)[0]
def std_err(x, y):
    """Return the standard error of the differences ``x - y``.

    Args:
        x: Array-like of values (e.g. predictions).
        y: Array-like of values (e.g. labels), broadcast-compatible with ``x``.

    Returns:
        The (population) standard deviation of ``x - y`` divided by the
        square root of ``len(x)``.
    """
    # np.asarray lets plain Python sequences be passed as well as arrays.
    diff = np.asarray(x) - np.asarray(y)
    return np.std(diff) / np.sqrt(len(x))
class Model:
    """Logistic mapping from predictor scores to intelligibility scores.

    The mapping is a simple logistic function scaled between 0 and 100
    (the original documentation describes the inputs as mbstoi scores).
    The two mapping parameters must first be fitted from
    (score, intelligibility) pairs with :meth:`fit`; once fitted,
    predictions are made with :meth:`predict`.
    """

    params = None  # Fitted (x0, k) parameters; None until fit() is called

    def _logistic_mapping(self, x, x0, k):
        """Evaluate the logistic function at ``x``.

        Args:
            x: Input value(s); scalar or array-like.
            x0: x value of the logistic's midpoint.
            k: The logistic growth rate, i.e. steepness of the curve.

        Returns:
            Value(s) in the open interval (0, 100).
        """
        upper = 100  # correctness can't be over 100
        return upper / (1 + np.exp(-k * (np.asarray(x) - x0)))

    def fit(self, pred, intel):
        """Fit a mapping between predictor scores and intelligibility scores.

        Args:
            pred: Predictor scores (independent variable).
            intel: Intelligibility scores to fit against (dependent variable).

        The fitted parameters are stored in ``self.params``.
        """
        initial_guess = [0.5, 1.0]  # Initial guess for (x0, k)
        # curve_fit returns (popt, pcov, ...); only the optimum is kept.
        self.params, *_remaining_returns = curve_fit(
            self._logistic_mapping, pred, intel, initial_guess
        )

    def predict(self, x):
        """Predict intelligibility scores from predictor scores.

        Args:
            x: Predictor score(s); scalar or array-like.

        Returns:
            The logistic mapping of ``x`` under the fitted parameters.

        Raises:
            RuntimeError: If :meth:`fit` has not been called yet.
        """
        # An explicit check is used instead of ``assert`` so that it still
        # fires when Python runs with optimisations enabled (-O).
        if self.params is None:
            raise RuntimeError("Model.fit() must be called before predict()")
        return self._logistic_mapping(x, self.params[0], self.params[1])
def compute_scores(predictions, labels):
    """Compute the evaluation metrics for a set of predictions.

    Args:
        predictions: Predicted scores.
        labels: Reference scores, aligned element-wise with ``predictions``.

    Returns:
        A dict with the keys ``"RMSE"``, ``"Std"``, ``"NCC"`` and ``"KT"``
        holding the results of ``rmse_score``, ``std_err``, ``ncc_score``
        and ``kt_score`` respectively.
    """
    return {
        "RMSE": rmse_score(predictions, labels),
        "Std": std_err(predictions, labels),
        "NCC": ncc_score(predictions, labels),
        "KT": kt_score(predictions, labels),
    }
def read_data(pred_json: Path, label_json: Path):
    """Load predictions and their matching labels from two JSON files.

    Args:
        pred_json: JSON file holding a mapping from signal name to
            prediction value.
        label_json: JSON file holding a list of records, each with a
            ``"signal"`` and a ``"correctness"`` entry.

    Returns:
        A tuple ``(prediction, label)`` of NumPy arrays in the iteration
        order of the prediction file. Predictions are multiplied by 100;
        labels are the ``"correctness"`` values looked up by signal name.

    Raises:
        KeyError: If a predicted signal has no entry in the label file.
    """
    # read label_json to dict
    with label_json.open("r", encoding="utf-8") as fp:
        labels = json.load(fp)
    label_dict = {item["signal"]: item["correctness"] for item in labels}

    with pred_json.open("r", encoding="utf-8") as fp:
        pred_dict = json.load(fp)

    # Both lists follow pred_dict's order, so they stay aligned element-wise.
    prediction = [pred * 100.0 for pred in pred_dict.values()]
    label = [label_dict[signal] for signal in pred_dict]

    return np.array(prediction), np.array(label)
def _evaluate_representation(cfg, track, dev_name, test_name):
    """Fit the logistic mapping on dev data and score it on test data.

    Args:
        cfg: Hydra configuration providing ``path.exp_folder`` and
            ``path.cpc1_train_data``.
        track: Suffix inserted into the label file names (``"_indep"`` or
            ``""``).
        dev_name: File name of the dev predictions inside the experiment
            folder.
        test_name: File name of the test predictions inside the experiment
            folder.

    Returns:
        The metric dict produced by ``compute_scores``.
    """
    prediction_dev, label_dev = read_data(
        Path(cfg.path.exp_folder) / dev_name,
        Path(cfg.path.cpc1_train_data) / f"metadata/CPC1.train{track}.json",
    )
    prediction_test, label_test = read_data(
        Path(cfg.path.exp_folder) / test_name,
        Path(f"../test_listener_responses/CPC1.test{track}.json"),
    )

    logger.info("Apply logistic fitting.")
    model = Model()
    model.fit(prediction_dev, label_dev)
    fit_pred = model.predict(prediction_test)

    # NOTE(review): read_data already multiplies predictions by 100 and Model
    # maps onto a 0-100 range; the extra "* 100" on both arguments is kept
    # exactly as in the original -- confirm the intended scale.
    return compute_scores(fit_pred * 100, label_test * 100)


@hydra.main(config_path=".", config_name="config")
def run(cfg: DictConfig) -> None:
    """Evaluate confidence and negative-entropy predictions for CPC1.

    For each of the two representations, a logistic mapping is fitted on the
    dev predictions and scored on the test predictions. Both metric dicts
    are written to ``results.json`` in the experiment folder.

    Args:
        cfg: Hydra configuration. ``cfg.cpc1_track`` selects the track and
            ``cfg.path`` provides the data and experiment locations.

    Raises:
        ValueError: If ``cfg.cpc1_track`` is neither ``"open"`` nor
            ``"closed"``.
    """
    if cfg.cpc1_track == "open":
        track = "_indep"
    elif cfg.cpc1_track == "closed":
        track = ""
    else:
        raise ValueError("cpc1_track has to be closed or open")

    # encoder representation evaluation
    conf_scores = _evaluate_representation(
        cfg, track, "dev_conf.json", "test_conf.json"
    )

    # decoder representation evaluation
    negent_scores = _evaluate_representation(
        cfg, track, "dev_negent.json", "test_negent.json"
    )

    results_file = Path(cfg.path.exp_folder) / "results.json"
    with results_file.open("w", encoding="utf-8") as fp:
        json.dump(
            {
                "confidence_results": conf_scores,
                "negative_entropy_results": negent_scores,
            },
            fp,
        )
# Hydra's decorator supplies ``cfg`` at call time, hence the pylint waiver.
# pylint: disable=no-value-for-parameter
if __name__ == "__main__":
    run()