added mnist
This commit is contained in:
parent a6336218e2
commit 839496fb8e
@@ -295,13 +295,6 @@ def lam_forward(dpq, gamma):
    return gamma * dpq / (1 + gamma * dpq)


# def kl_div(p, q):
#     p = np.asarray(p, dtype=np.float32)
#     q = np.asarray(q + 1e-8, dtype=np.float32)
#
#     return np.sum(np.where(p != 0, p * np.log(p / q), 0))


def kl_div(p, q, eps=1e-12):
    p = np.asarray(p, dtype=float)
    q = np.asarray(q, dtype=float)
@@ -5,170 +5,16 @@ from pathlib import Path
|
|||
from jax import numpy as jnp
|
||||
from sklearn.base import BaseEstimator
|
||||
|
||||
import error
|
||||
import functional as F
|
||||
import quapy.functional as F
|
||||
|
||||
import quapy as qp
|
||||
import numpy as np
|
||||
|
||||
from method.aggregative import KDEyML
|
||||
from quapy.functional import l1_norm, ILRtransformation
|
||||
from quapy.method.aggregative import KDEyML
|
||||
from quapy.functional import ILRtransformation
|
||||
from scipy.stats import entropy
|
||||
from abc import ABC, abstractmethod
|
||||
|
||||
|
||||
FINEGRAINED = True
|
||||
RESULT_DIR = Path('results_finegrained') if FINEGRAINED else Path('results')
|
||||
|
||||
|
||||
class DatasetHandler(ABC):
|
||||
|
||||
def __init__(self, name:str, sample_size:int):
|
||||
self._name = name
|
||||
self._sample_size = sample_size
|
||||
|
||||
@abstractmethod
|
||||
def get_training(self): ...
|
||||
|
||||
@abstractmethod
|
||||
def get_train_testprot_for_eval(self): ...
|
||||
|
||||
@abstractmethod
|
||||
def get_train_valprot_for_modsel(self): ...
|
||||
|
||||
def sample_size(self):
|
||||
return self._sample_size
|
||||
|
||||
def name(self):
|
||||
return self._name
|
||||
|
||||
@classmethod
|
||||
@abstractmethod
|
||||
def iter(cls): ...
|
||||
|
||||
def __repr__(self):
|
||||
return self.__class__.__name__
|
||||
|
||||
@classmethod
|
||||
@abstractmethod
|
||||
def is_binary(self):
|
||||
...
|
||||
|
||||
|
||||
class UCIMulticlassHandler(DatasetHandler):
|
||||
|
||||
DATASETS = qp.datasets.UCI_MULTICLASS_DATASETS.copy()
|
||||
|
||||
def __init__(self, name, n_val_samples=100, n_test_samples=100):
|
||||
super().__init__(name, sample_size=1000)
|
||||
self._dataset = None # lazy fetch
|
||||
self.n_val_samples = n_val_samples
|
||||
self.n_test_samples = n_test_samples
|
||||
|
||||
def get_training(self):
|
||||
return self.dataset().training
|
||||
|
||||
def get_train_testprot_for_eval(self):
|
||||
training, test = self.dataset().train_test
|
||||
test_generator = qp.protocol.UPP(test, repeats=self.n_test_samples, random_state=0)
|
||||
return training, test_generator
|
||||
|
||||
def get_train_valprot_for_modsel(self):
|
||||
training = self.dataset().training
|
||||
training, val = training.split_stratified(train_prop=0.6, random_state=0)
|
||||
val_generator = qp.protocol.UPP(val, repeats=self.n_val_samples, random_state=0)
|
||||
return training, val_generator
|
||||
|
||||
@lru_cache(maxsize=None)
|
||||
def dataset(self):
|
||||
if self._dataset is None:
|
||||
self._dataset = qp.datasets.fetch_UCIMulticlassDataset(self.name(), min_class_support=0.01)
|
||||
return self._dataset
|
||||
|
||||
def __repr__(self):
|
||||
return "" # self.dataset().__repr__()
|
||||
|
||||
@classmethod
|
||||
def iter(cls):
|
||||
for name in cls.DATASETS:
|
||||
yield cls(name)
|
||||
|
||||
@classmethod
|
||||
def is_binary(self):
|
||||
return False
|
||||
|
||||
|
||||
class LeQuaHandler(DatasetHandler):
|
||||
|
||||
DATASETS = ['LeQua2022', 'LeQua2024']
|
||||
|
||||
def __init__(self, name):
|
||||
super().__init__(name, sample_size=1000)
|
||||
self._dataset = None # lazy fetch
|
||||
|
||||
def get_training(self):
|
||||
return self.dataset()[0]
|
||||
|
||||
def get_train_testprot_for_eval(self):
|
||||
training, _, test_generator = self.dataset()
|
||||
return training, test_generator
|
||||
|
||||
def get_train_valprot_for_modsel(self):
|
||||
training, val_generator, _ = self.dataset()
|
||||
return training, val_generator
|
||||
|
||||
@lru_cache(maxsize=None)
|
||||
def dataset(self):
|
||||
if self._dataset is None:
|
||||
if self.name()=='LeQua2022':
|
||||
self._dataset = qp.datasets.fetch_lequa2022(task='T1B')
|
||||
elif self.name()=='LeQua2024':
|
||||
self._dataset = qp.datasets.fetch_lequa2024(task='T2')
|
||||
else:
|
||||
raise ValueError(f'unexpected dataset name {self.name()}; valid ones are {self.DATASETS}')
|
||||
return self._dataset
|
||||
|
||||
def __repr__(self):
|
||||
return self.dataset().__repr__()
|
||||
|
||||
@classmethod
|
||||
def iter(cls):
|
||||
for name in cls.DATASETS:
|
||||
yield cls(name)
|
||||
|
||||
@classmethod
|
||||
def is_binary(self):
|
||||
return False
|
||||
|
||||
# def fetch_UCI_multiclass(data_name):
|
||||
# return qp.datasets.fetch_UCIMulticlassDataset(data_name, min_class_support=0.01)
|
||||
|
||||
|
||||
def fetch_UCI_binary(data_name):
|
||||
return qp.datasets.fetch_UCIBinaryDataset(data_name)
|
||||
|
||||
# global configurations
|
||||
|
||||
binary = {
|
||||
'datasets': qp.datasets.UCI_BINARY_DATASETS.copy(),
|
||||
'fetch_fn': fetch_UCI_binary,
|
||||
'sample_size': 500
|
||||
}
|
||||
|
||||
# multiclass = {
|
||||
# 'datasets': qp.datasets.UCI_MULTICLASS_DATASETS.copy(),
|
||||
# 'fetch_fn': fetch_UCI_multiclass,
|
||||
# 'sample_size': 1000
|
||||
# }
|
||||
# try:
|
||||
# multiclass['datasets'].remove('poker_hand') # random performance
|
||||
# multiclass['datasets'].remove('hcv') # random performance
|
||||
# multiclass['datasets'].remove('letter') # many classes
|
||||
# multiclass['datasets'].remove('isolet') # many classes
|
||||
# except ValueError:
|
||||
# pass
|
||||
|
||||
|
||||
RESULT_DIR = Path('results')
|
||||
|
||||
|
||||
# utils
|
||||
|
|
@@ -266,5 +112,25 @@ class ILRtransformation(F.CompositionalTransformation):
        return ilr_basis(k)


def in_simplex(x):
    return np.all(x >= 0) and np.isclose(x.sum(), 1)
def in_simplex(x, atol=1e-8):
    x = np.asarray(x)

    non_negative = np.all(x >= 0, axis=-1)
    sum_to_one = np.isclose(x.sum(axis=-1), 1.0, atol=atol)

    return non_negative & sum_to_one
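A minimal illustration of the batched behaviour of the new in_simplex (a sketch relying only on the function defined above, not part of the commit):

# one boolean per row: non-negative entries and a row sum close to 1
points = np.asarray([[0.2, 0.3, 0.5],    # a valid prevalence vector
                     [0.6, 0.6, -0.2]])  # sums to 1 but has a negative entry
print(in_simplex(points))                # expected: [ True False]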


class MockClassifierFromPosteriors(BaseEstimator):
    def __init__(self):
        pass

    def fit(self, X, y):
        self.classes_ = sorted(np.unique(y))
        return self

    def predict(self, X):
        return np.argmax(X, axis=1)

    def predict_proba(self, X):
        return X
@@ -0,0 +1,39 @@
Dataset: mnist
Model: basiccnn
Number of classes: 10
Train samples: 42000
Validation samples: 18000
Test samples: 10000
Validation accuracy: 0.9895
Test accuracy: 0.9901
Github repository: ....

Data Loading Instructions:
The extracted features, predictions, targets, and logits are saved in .npz files.
To load the data in Python:

import numpy as np

# Load training data
train_data = np.load('mnist_basiccnn_train_out.npz')
train_features = train_data['features']
train_predictions = train_data['predictions']
train_targets = train_data['targets']
train_logits = train_data['logits']

# Load validation data
val_data = np.load('mnist_basiccnn_val_out.npz')
val_features = val_data['features']
val_predictions = val_data['predictions']
val_targets = val_data['targets']
val_logits = val_data['logits']

# Load test data
test_data = np.load('mnist_basiccnn_test_out.npz')
test_features = test_data['features']
test_predictions = test_data['predictions']
test_targets = test_data['targets']
test_logits = test_data['logits']

Note: features are the output of the feature extractor (before the final classification layer),
predictions are softmax probabilities, targets are the true labels, and logits are the raw model outputs.
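A quick consistency check after loading (a hedged sketch, not one of the shipped files; it relies only on the keys documented above):

import numpy as np
from scipy.special import softmax

val_data = np.load('mnist_basiccnn_val_out.npz')
# 'predictions' should be the row-wise softmax of 'logits' ...
assert np.allclose(val_data['predictions'], softmax(val_data['logits'], axis=1), atol=1e-5)
# ... and their argmax against 'targets' should reproduce the validation accuracy reported above (~0.9895)
print((val_data['predictions'].argmax(axis=1) == val_data['targets']).mean())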
Binary file not shown.
Binary file not shown.
Binary file not shown.
@@ -0,0 +1,270 @@
import inspect
from abc import ABC, abstractmethod
from functools import lru_cache

import numpy as np
from pathlib import Path
import quapy as qp

from commons import MockClassifierFromPosteriors
from quapy.protocol import UPP
from quapy.data import LabelledCollection
from quapy.method.aggregative import EMQ


def fetchMNIST(modality, data_home='./data/mnist_basiccnn'):
    MODALITY = ('features', 'predictions', 'logits')
    assert modality in MODALITY, f'unknown modality, valid ones are {MODALITY}'

    data_home = Path(data_home)

    # Load training data
    train_data = np.load(data_home/'mnist_basiccnn_train_out.npz')
    train_X = train_data[modality]
    train_y = train_data['targets']

    # Load validation data
    val_data = np.load(data_home/'mnist_basiccnn_val_out.npz')
    val_X = val_data[modality]
    val_y = val_data['targets']

    # Load test data
    test_data = np.load(data_home/'mnist_basiccnn_test_out.npz')
    test_X = test_data[modality]
    test_y = test_data['targets']

    print(f'loaded MNIST ({modality=}): '
          f'#train={len(train_y)}, #val={len(val_y)}, #test={len(test_y)}, #features={train_X.shape[1]}')

    train = LabelledCollection(train_X, train_y)
    val = LabelledCollection(val_X, val_y, classes=train.classes_)
    test = LabelledCollection(test_X, test_y, classes=train.classes_)

    return train, val, test


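With the 'predictions' modality, each instance is represented by the CNN's 10-dimensional posterior vector rather than by raw pixels, which is what later allows MockClassifierFromPosteriors to stand in for a pre-trained classifier. A minimal sanity check (a sketch assuming only the function above and quapy's LabelledCollection API):

train, val, test = fetchMNIST(modality='predictions')
# posteriors as covariates: the feature dimension equals the number of classes
assert train.X.shape[1] == train.n_classes == 10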
class DatasetHandler(ABC):
|
||||
|
||||
def __init__(self, name):
|
||||
self.name = name
|
||||
|
||||
@classmethod
|
||||
def get_defaults(cls):
|
||||
sig = inspect.signature(cls.__init__)
|
||||
|
||||
defaults = {
|
||||
name: param.default
|
||||
for name, param in sig.parameters.items()
|
||||
if param.default is not inspect.Parameter.empty
|
||||
}
|
||||
|
||||
return defaults
|
||||
|
||||
@abstractmethod
|
||||
def get_training(self): ...
|
||||
|
||||
@abstractmethod
|
||||
def get_train_testprot_for_eval(self): ...
|
||||
|
||||
@abstractmethod
|
||||
def get_train_valprot_for_modsel(self): ...
|
||||
|
||||
@classmethod
|
||||
@abstractmethod
|
||||
def get_datasets(cls): ...
|
||||
|
||||
@classmethod
|
||||
def iter(cls, **kwargs):
|
||||
for name in cls.get_datasets():
|
||||
yield cls(name, **kwargs)
|
||||
|
||||
def __repr__(self):
|
||||
return f'{self.__class__.__name__}({self.name})'
|
||||
|
||||
@classmethod
|
||||
@abstractmethod
|
||||
def is_binary(self): ...
|
||||
|
||||
|
||||
class MNISTHandler(DatasetHandler):
|
||||
|
||||
def __init__(self, n_val_samples=100, n_test_samples=100, sample_size=500, random_state=0):
|
||||
super().__init__(name='MNIST')
|
||||
self.n_val_samples = n_val_samples
|
||||
self.n_test_samples = n_test_samples
|
||||
self.sample_size = sample_size
|
||||
self.random_state = random_state
|
||||
|
||||
@lru_cache(maxsize=None)
|
||||
def dataset(self):
|
||||
return fetchMNIST(modality='predictions')
|
||||
|
||||
def get_training(self):
|
||||
return self.dataset()[0]
|
||||
|
||||
def get_validation(self):
|
||||
return self.dataset()[1]
|
||||
|
||||
def get_train_testprot_for_eval(self):
|
||||
# note that the training goes on the validation split, since the proper training was used for training the neural network
|
||||
_, val, test = self.dataset()
|
||||
test_prot = UPP(test, sample_size=self.sample_size, repeats=self.n_test_samples, random_state=self.random_state)
|
||||
return val, test_prot
|
||||
|
||||
def get_train_valprot_for_modsel(self):
|
||||
# the training split is never used (was used to train a neural model)
|
||||
# we consider the validation split as our training data, so we return a new split on it
|
||||
_, val, _ = self.dataset()
|
||||
train, val = val.split_stratified(train_prop=0.6, random_state=self.random_state)
|
||||
val_prot = UPP(val, sample_size=self.sample_size, repeats=self.n_val_samples, random_state=self.random_state)
|
||||
return train, val_prot
|
||||
|
||||
@classmethod
|
||||
def get_datasets(cls):
|
||||
return ['MNIST']
|
||||
|
||||
@classmethod
|
||||
def iter(cls, **kwargs):
|
||||
yield cls(**kwargs)
|
||||
|
||||
def __repr__(self):
|
||||
return f'{self.name}'
|
||||
|
||||
@classmethod
|
||||
def is_binary(self):
|
||||
return False
|
||||
|
||||
|
||||
# LeQua multiclass tasks
|
||||
class LeQuaHandler(DatasetHandler):
|
||||
|
||||
DATASETS = ['LeQua2022', 'LeQua2024']
|
||||
|
||||
def __init__(self, name):
|
||||
super().__init__(name)
|
||||
self.sample_size = 1000
|
||||
|
||||
def get_training(self):
|
||||
return self.dataset()[0]
|
||||
|
||||
def get_train_testprot_for_eval(self):
|
||||
training, _, test_generator = self.dataset()
|
||||
return training, test_generator
|
||||
|
||||
def get_train_valprot_for_modsel(self):
|
||||
training, val_generator, _ = self.dataset()
|
||||
return training, val_generator
|
||||
|
||||
@lru_cache(maxsize=None)
|
||||
def dataset(self):
|
||||
if self.name=='LeQua2022':
|
||||
return qp.datasets.fetch_lequa2022(task='T1B')
|
||||
elif self.name=='LeQua2024':
|
||||
return qp.datasets.fetch_lequa2024(task='T2')
|
||||
else:
|
||||
raise ValueError(f'unexpected dataset name {self.name}; valid ones are {self.DATASETS}')
|
||||
|
||||
def __repr__(self):
|
||||
return self.name
|
||||
|
||||
@classmethod
|
||||
def iter(cls):
|
||||
for name in cls.DATASETS:
|
||||
yield cls(name)
|
||||
|
||||
@classmethod
|
||||
def is_binary(self):
|
||||
return False
|
||||
|
||||
@classmethod
|
||||
def get_datasets(cls):
|
||||
return cls.DATASETS
|
||||
|
||||
|
||||
class UCIDatasetHandler(DatasetHandler, ABC):
|
||||
DATASETS = []
|
||||
|
||||
def __init__(self, name, n_val_samples, n_test_samples, sample_size, random_state):
|
||||
super().__init__(name=name)
|
||||
self.sample_size = sample_size
|
||||
self.n_val_samples = n_val_samples
|
||||
self.n_test_samples = n_test_samples
|
||||
self.random_state = random_state
|
||||
|
||||
def get_training(self):
|
||||
return self.dataset().training
|
||||
|
||||
def get_train_testprot_for_eval(self):
|
||||
training, test = self.dataset().train_test
|
||||
test_generator = qp.protocol.UPP(test, sample_size=self.sample_size, repeats=self.n_test_samples,
|
||||
random_state=self.random_state)
|
||||
return training, test_generator
|
||||
|
||||
def get_train_valprot_for_modsel(self):
|
||||
training = self.dataset().training
|
||||
training, val = training.split_stratified(train_prop=0.6, random_state=self.random_state)
|
||||
val_generator = qp.protocol.UPP(val, sample_size=self.sample_size, repeats=self.n_val_samples,
|
||||
random_state=self.random_state)
|
||||
return training, val_generator
|
||||
|
||||
@classmethod
|
||||
def get_datasets(cls):
|
||||
return cls.DATASETS
|
||||
|
||||
@classmethod
|
||||
def iter(cls):
|
||||
for name in cls.DATASETS:
|
||||
yield cls(name)
|
||||
|
||||
|
||||
class UCIMulticlassHandler(UCIDatasetHandler):
|
||||
|
||||
DATASETS = [d for d in qp.datasets.UCI_MULTICLASS_DATASETS if d not in frozenset(['hcv', 'poker_hand'])]
|
||||
|
||||
def __init__(self, name, n_val_samples=100, n_test_samples=100, sample_size=1000, random_state=0):
|
||||
super().__init__(name, n_val_samples, n_test_samples, sample_size, random_state)
|
||||
|
||||
@lru_cache(maxsize=None)
|
||||
def dataset(self):
|
||||
return qp.datasets.fetch_UCIMulticlassDataset(self.name, min_class_support=0.01)
|
||||
|
||||
def __repr__(self):
|
||||
return f'{self.name}(UCI-multiclass)'
|
||||
|
||||
@classmethod
|
||||
def is_binary(self):
|
||||
return False
|
||||
|
||||
|
||||
class UCIBinaryHandler(DatasetHandler):
|
||||
|
||||
DATASETS = qp.datasets.UCI_BINARY_DATASETS.copy()
|
||||
|
||||
def __init__(self, name, n_val_samples=100, n_test_samples=100, sample_size=500, random_state=0):
|
||||
super().__init__(name, n_val_samples, n_test_samples, sample_size, random_state)
|
||||
|
||||
@lru_cache(maxsize=None)
|
||||
def dataset(self):
|
||||
return qp.datasets.fetch_UCIBinaryDataset(self.name)
|
||||
|
||||
def __repr__(self):
|
||||
return f'{self.name}(UCI-binary)'
|
||||
|
||||
|
||||
@classmethod
|
||||
def is_binary(self):
|
||||
return True
|
||||
|
||||
|
||||
if __name__ == '__main__':
    train, val, test = fetchMNIST(modality='predictions')
    cls = MockClassifierFromPosteriors()
    cls.fit(*train.Xy)
    # q = KDEyML(classifier=cls, fit_classifier=False)
    # q = PACC(classifier=cls, fit_classifier=False)
    q = EMQ(classifier=cls, fit_classifier=False)
    q.fit(*val.Xy)
    test_prot = UPP(test, repeats=100, sample_size=500)
    report = qp.evaluation.evaluation_report(q, test_prot, verbose=True)
    print(report.mean(numeric_only=True))
@@ -1,13 +1,14 @@
|
|||
from pathlib import Path
|
||||
|
||||
from sklearn.linear_model import LogisticRegression as LR
|
||||
from sklearn.linear_model import LogisticRegression
|
||||
from copy import deepcopy as cp
|
||||
import quapy as qp
|
||||
from BayesianKDEy._bayeisan_kdey import BayesianKDEy
|
||||
from BayesianKDEy._bayesian_mapls import BayesianMAPLS
|
||||
from BayesianKDEy.commons import experiment_path, KDEyCLR, FINEGRAINED, RESULT_DIR, DatasetHandler, \
|
||||
UCIMulticlassHandler, LeQuaHandler
|
||||
from BayesianKDEy.temperature_calibration import temp_calibration
|
||||
from _bayeisan_kdey import BayesianKDEy
|
||||
from _bayesian_mapls import BayesianMAPLS
|
||||
from commons import experiment_path, KDEyCLR, RESULT_DIR, MockClassifierFromPosteriors
|
||||
# import datasets
|
||||
from datasets import LeQuaHandler, UCIMulticlassHandler, DatasetHandler, MNISTHandler
|
||||
from temperature_calibration import temp_calibration
|
||||
from build.lib.quapy.data import LabelledCollection
|
||||
from quapy.method.aggregative import DistributionMatchingY as DMy, AggregativeQuantifier, EMQ, CC
|
||||
from quapy.model_selection import GridSearchQ
|
||||
|
|
@@ -22,7 +23,7 @@ from time import time
|
|||
|
||||
|
||||
|
||||
def methods():
|
||||
def methods(data_handler: DatasetHandler):
|
||||
"""
|
||||
Returns a tuple (name, quantifier, hyperparams, bayesian/bootstrap_constructor), where:
|
||||
- name: is a str representing the name of the method (e.g., 'BayesianKDEy')
|
||||
|
|
@@ -31,46 +32,49 @@ def methods():
|
|||
- bayesian/bootstrap_constructor: is a function that instantiates the bayesian or bootstrap method with the
|
||||
quantifier with optimized hyperparameters
|
||||
"""
|
||||
if FINEGRAINED:
|
||||
lr_hyper = {'classifier__C': np.logspace(-4,4,9), 'classifier__class_weight': ['balanced', None]}
|
||||
acc_hyper = lr_hyper
|
||||
emq_hyper = {'calib': ['nbvs', 'bcts', 'ts', 'vs'], **lr_hyper}
|
||||
hdy_hyper = {'nbins': [3,4,5,8,16,32], **lr_hyper}
|
||||
kdey_hyper = {'bandwidth': np.logspace(-3, -1, 10), **lr_hyper}
|
||||
kdey_hyper_clr = {'bandwidth': np.logspace(-2, 2, 10), **lr_hyper}
|
||||
if isinstance(data_handler, MNISTHandler):
|
||||
Cls = MockClassifierFromPosteriors
|
||||
cls_hyper = {}
|
||||
val_split = data_handler.get_validation().Xy # use this specific collection
|
||||
else:
|
||||
acc_hyper = {}
|
||||
emq_hyper = {'calib': ['nbvs', 'bcts', 'ts', 'vs']}
|
||||
hdy_hyper = {'nbins': [3,4,5,8,16,32]}
|
||||
kdey_hyper = {'bandwidth': [0.001, 0.005, 0.01, 0.05, 0.1, 0.2]}
|
||||
kdey_hyper_clr = {'bandwidth': [0.05, 0.1, 0.5, 1., 2., 5.]}
|
||||
|
||||
Cls = LogisticRegression
|
||||
cls_hyper = {'classifier__C': np.logspace(-4,4,9), 'classifier__class_weight': ['balanced', None]}
|
||||
val_split = 5 # k-fold cross-validation
|
||||
acc_hyper = cls_hyper
|
||||
# emq_hyper = {'calib': ['nbvs', 'bcts', 'ts', 'vs'], **cls_hyper}
|
||||
hdy_hyper = {'nbins': [3,4,5,8,16,32], **cls_hyper}
|
||||
kdey_hyper = {'bandwidth': np.logspace(-3, -1, 10), **cls_hyper}
|
||||
kdey_hyper_clr = {'bandwidth': np.logspace(-2, 2, 10), **cls_hyper}
|
||||
|
||||
multiclass_method = 'multiclass'
|
||||
only_binary = 'only_binary'
|
||||
only_multiclass = 'only_multiclass'
|
||||
|
||||
# surrogate quantifiers
|
||||
acc = ACC(Cls(), val_split=val_split)
|
||||
hdy = DMy(Cls(), val_split=val_split)
|
||||
kde_gau = KDEyML(Cls(), val_split=val_split)
|
||||
kde_ait = KDEyCLR(Cls(), val_split=val_split)
|
||||
emq = EMQ(Cls(), exact_train_prev=False, val_split=val_split)
|
||||
|
||||
|
||||
# Bootstrap approaches:
|
||||
# --------------------------------------------------------------------------------------------------------
|
||||
#yield 'BootstrapACC', ACC(LR()), acc_hyper, lambda hyper: AggregativeBootstrap(ACC(LR()), n_test_samples=1000, random_state=0), multiclass_method
|
||||
#yield 'BootstrapEMQ', EMQ(LR(), on_calib_error='backup', val_split=5), emq_hyper, lambda hyper: AggregativeBootstrap(EMQ(LR(), on_calib_error='backup', calib=hyper['calib'], val_split=5), n_test_samples=1000, random_state=0), multiclass_method
|
||||
#yield 'BootstrapHDy', DMy(LR()), hdy_hyper, lambda hyper: AggregativeBootstrap(DMy(LR(), **hyper), n_test_samples=1000, random_state=0), multiclass_method
|
||||
#yield 'BootstrapKDEy', KDEyML(LR()), kdey_hyper, lambda hyper: AggregativeBootstrap(KDEyML(LR(), **hyper), n_test_samples=1000, random_state=0, verbose=True), multiclass_method
|
||||
#yield 'BootstrapACC', acc, acc_hyper, lambda hyper: _AggregativeBootstrap(ACC(Cls()), n_test_samples=1000, random_state=0), multiclass_method
|
||||
#yield 'BootstrapEMQ', emq, on_calib_error='backup', val_split=5), emq_hyper, lambda hyper: _AggregativeBootstrap(EMQ(Cls(), on_calib_error='backup', calib=hyper['calib'], val_split=5), n_test_samples=1000, random_state=0), multiclass_method
|
||||
#yield 'BootstrapHDy', hdy, hdy_hyper, lambda hyper: _AggregativeBootstrap(DMy(Cls(), **hyper), n_test_samples=1000, random_state=0), multiclass_method
|
||||
#yield 'BootstrapKDEy', kde_gau, kdey_hyper, lambda hyper: _AggregativeBootstrap(KDEyML(Cls(), **hyper), n_test_samples=1000, random_state=0, verbose=True), multiclass_method
|
||||
|
||||
# Bayesian approaches:
|
||||
# --------------------------------------------------------------------------------------------------------
|
||||
# yield 'BayesianACC', ACC(LR()), acc_hyper, lambda hyper: BayesianCC(LR(), mcmc_seed=0), multiclass_method
|
||||
# yield 'BayesianHDy', DMy(LR()), hdy_hyper, lambda hyper: PQ(LR(), stan_seed=0, **hyper), only_binary
|
||||
#
|
||||
#yield f'BaKDE-numpyro', KDEyML(LR()), kdey_hyper, lambda hyper: BayesianKDEy(mcmc_seed=0, engine='numpyro', **hyper), multiclass_method
|
||||
# yield f'BaKDE-numpyro-T2', KDEyML(LR()), kdey_hyper, lambda hyper: BayesianKDEy(mcmc_seed=0, engine='numpyro', temperature=2., **hyper), multiclass_method
|
||||
# yield f'BaKDE-numpyro-T*', KDEyML(LR()), kdey_hyper, lambda hyper: BayesianKDEy(mcmc_seed=0, engine='numpyro', temperature=None, **hyper), multiclass_method
|
||||
#yield f'BaKDE-Ait-numpyro', KDEyCLR(LR()), kdey_hyper_clr, lambda hyper: BayesianKDEy(LR(), kernel='aitchison', mcmc_seed=0, engine='numpyro', **hyper), multiclass_method
|
||||
# yield f'BaKDE-Gau-numpyro', KDEyML(LR()), kdey_hyper, lambda hyper: BayesianKDEy(LR(), kernel='gaussian', mcmc_seed=0, engine='numpyro', **hyper), multiclass_method
|
||||
# yield f'BaKDE-Ait-T*', KDEyCLR(LR()), kdey_hyper_clr, lambda hyper: BayesianKDEy(LR(),kernel='aitchison', mcmc_seed=0, engine='numpyro', temperature=None, **hyper), multiclass_method
|
||||
# yield f'BaKDE-Gau-T*', KDEyML(LR()), kdey_hyper, lambda hyper: BayesianKDEy(LR(), kernel='gaussian', mcmc_seed=0, engine='numpyro', temperature=None, **hyper), multiclass_method
|
||||
yield 'BayEMQ-U-Temp1-2', CC(LR()), acc_hyper, lambda hyper: BayesianMAPLS(LR(), prior='uniform', temperature=1, exact_train_prev=True), multiclass_method
|
||||
yield 'BayEMQ-T*', CC(LR()), acc_hyper, lambda hyper: BayesianMAPLS(LR(), prior='uniform', temperature=None, exact_train_prev=True), multiclass_method
|
||||
# yield 'BayesianACC', acc, acc_hyper, lambda hyper: BayesianCC(Cls(), val_split=val_split, mcmc_seed=0), multiclass_method
|
||||
#yield 'BayesianHDy', hdy, hdy_hyper, lambda hyper: PQ(Cls(), val_split=val_split, stan_seed=0, **hyper), only_binary
|
||||
yield f'BaKDE-Ait-numpyro', kde_ait, kdey_hyper_clr, lambda hyper: BayesianKDEy(Cls(), kernel='aitchison', mcmc_seed=0, engine='numpyro', val_split=val_split, **hyper), multiclass_method
|
||||
yield f'BaKDE-Gau-numpyro', kde_gau, kdey_hyper, lambda hyper: BayesianKDEy(Cls(), kernel='gaussian', mcmc_seed=0, engine='numpyro', val_split=val_split, **hyper), multiclass_method
|
||||
yield f'BaKDE-Ait-T*', kde_ait, kdey_hyper_clr, lambda hyper: BayesianKDEy(Cls(),kernel='aitchison', mcmc_seed=0, engine='numpyro', temperature=None, val_split=val_split, **hyper), multiclass_method
|
||||
yield f'BaKDE-Gau-T*', kde_gau, kdey_hyper, lambda hyper: BayesianKDEy(Cls(), kernel='gaussian', mcmc_seed=0, engine='numpyro', temperature=None, val_split=val_split, **hyper), multiclass_method
|
||||
# yield 'BayEMQ', emq, acc_hyper, lambda hyper: BayesianMAPLS(Cls(), prior='uniform', temperature=1, exact_train_prev=False, val_split=val_split), multiclass_method
|
||||
# yield 'BayEMQ*', emq, acc_hyper, lambda hyper: BayesianMAPLS(Cls(), prior='uniform', temperature=None, exact_train_prev=False, val_split=val_split), multiclass_method
|
||||
|
||||
|
||||
def model_selection(dataset: DatasetHandler, point_quantifier: AggregativeQuantifier, grid: dict):
|
||||
|
|
@@ -95,11 +99,21 @@ def model_selection(dataset: DatasetHandler, point_quantifier: AggregativeQuanti
|
|||
|
||||
|
||||
def temperature_calibration(dataset: DatasetHandler, uncertainty_quantifier):
|
||||
if hasattr(uncertainty_quantifier, 'temperature') and uncertainty_quantifier.temperature is None:
|
||||
print('calibrating temperature')
|
||||
train, val_prot = dataset.get_train_valprot_for_modsel()
|
||||
temperature = temp_calibration(uncertainty_quantifier, train, val_prot, n_jobs=-1)
|
||||
uncertainty_quantifier.temperature = temperature
|
||||
temperature = None
|
||||
if hasattr(uncertainty_quantifier, 'temperature'):
|
||||
if uncertainty_quantifier.temperature is None:
|
||||
print('calibrating temperature')
|
||||
train, val_prot = dataset.get_train_valprot_for_modsel()
|
||||
if dataset.name.startswith('LeQua'):
|
||||
temp_grid=[100., 500, 1000, 5_000, 10_000, 50_000]
|
||||
else:
|
||||
temp_grid=[.5, 1., 1.5, 2., 5., 10., 100.]
|
||||
temperature = temp_calibration(uncertainty_quantifier, train, val_prot, temp_grid=temp_grid, n_jobs=-1)
|
||||
uncertainty_quantifier.temperature = temperature
|
||||
else:
|
||||
temperature = uncertainty_quantifier.temperature
|
||||
return temperature
|
||||
|
||||
|
||||
|
||||
def experiment(dataset: DatasetHandler, point_quantifier: AggregativeQuantifier, method_name:str, grid: dict, uncertainty_quant_constructor, hyper_choice_path: Path):
|
||||
|
|
@@ -113,7 +127,7 @@ def experiment(dataset: DatasetHandler, point_quantifier: AggregativeQuantifier,
|
|||
|
||||
t_init = time()
|
||||
uncertainty_quantifier = uncertainty_quant_constructor(best_hyperparams)
|
||||
temperature_calibration(dataset, uncertainty_quantifier)
|
||||
temperature = temperature_calibration(dataset, uncertainty_quantifier)
|
||||
training, test_generator = dataset.get_train_testprot_for_eval()
|
||||
uncertainty_quantifier.fit(*training.Xy)
|
||||
tr_time = time() - t_init
|
||||
|
|
@@ -144,7 +158,8 @@ def experiment(dataset: DatasetHandler, point_quantifier: AggregativeQuantifier,
|
|||
'optim_hyper': best_hyperparams,
|
||||
'train_time': tr_time,
|
||||
'train-prev': train_prevalence,
|
||||
'results': {k:np.asarray(v) for k,v in results.items()}
|
||||
'results': {k:np.asarray(v) for k,v in results.items()},
|
||||
'temperature': temperature
|
||||
}
|
||||
|
||||
return report
|
||||
|
|
@@ -162,25 +177,25 @@ if __name__ == '__main__':
|
|||
|
||||
result_dir = RESULT_DIR
|
||||
|
||||
for data_handler in [LeQuaHandler]:#, UCIMulticlassHandler]:
|
||||
for data_handler in [MNISTHandler]:#, UCIMulticlassHandler,LeQuaHandler]:
|
||||
for dataset in data_handler.iter():
|
||||
qp.environ['SAMPLE_SIZE'] = dataset.sample_size()
|
||||
print(f'dataset={dataset}')
|
||||
qp.environ['SAMPLE_SIZE'] = dataset.sample_size
|
||||
print(f'dataset={dataset.name}')
|
||||
|
||||
problem_type = 'binary' if dataset.is_binary() else 'multiclass'
|
||||
|
||||
for method_name, surrogate_quant, hyper_params, withconf_constructor, method_scope in methods():
|
||||
for method_name, surrogate_quant, hyper_params, withconf_constructor, method_scope in methods(dataset):
|
||||
if check_skip_experiment(method_scope, dataset):
|
||||
continue
|
||||
|
||||
result_path = experiment_path(result_dir / problem_type, dataset.name(), method_name)
|
||||
hyper_path = experiment_path(result_dir / 'hyperparams' / problem_type, dataset.name(), surrogate_quant.__class__.__name__)
|
||||
result_path = experiment_path(result_dir / problem_type, dataset.name, method_name)
|
||||
hyper_path = experiment_path(result_dir / 'hyperparams' / problem_type, dataset.name, surrogate_quant.__class__.__name__)
|
||||
|
||||
report = qp.util.pickled_resource(
|
||||
result_path, experiment, dataset, surrogate_quant, method_name, hyper_params, withconf_constructor, hyper_path
|
||||
)
|
||||
|
||||
print(f'dataset={dataset}, '
|
||||
print(f'dataset={dataset.name}, '
|
||||
f'method={method_name}: '
|
||||
f'mae={report["results"]["ae"].mean():.5f}, '
|
||||
f'W={report["results"]["sre"].mean():.5f}, '
|
||||
|
|
|
|||
|
|
@@ -7,7 +7,8 @@ import pandas as pd
|
|||
from glob import glob
|
||||
from pathlib import Path
|
||||
import quapy as qp
|
||||
from BayesianKDEy.commons import RESULT_DIR, UCIMulticlassHandler
|
||||
from BayesianKDEy.commons import RESULT_DIR
|
||||
from BayesianKDEy.datasets import LeQuaHandler, UCIMulticlassHandler, MNISTHandler
|
||||
from error import dist_aitchison
|
||||
from quapy.method.confidence import ConfidenceIntervals
|
||||
from quapy.method.confidence import ConfidenceEllipseSimplex, ConfidenceEllipseCLR, ConfidenceEllipseILR, ConfidenceIntervals, ConfidenceRegionABC
|
||||
|
|
@@ -23,23 +24,14 @@ pd.set_option("display.float_format", "{:.4f}".format)
|
|||
|
||||
# methods = None # show all methods
|
||||
methods = ['BayesianACC',
|
||||
#'BayesianKDEy',
|
||||
#'BaKDE-emcee',
|
||||
# 'BaKDE-numpyro',
|
||||
# 'BaKDE-numpyro-T2',
|
||||
# 'BaKDE-numpyro-T10',
|
||||
# 'BaKDE-numpyro-T*',
|
||||
'BaKDE-Ait-numpyro',
|
||||
'BaKDE-Ait-T*',
|
||||
'BaKDE-Gau-numpyro',
|
||||
'BaKDE-Gau-T*',
|
||||
'BayEMQ-U-Temp1-2',
|
||||
'BayEMQ-T*',
|
||||
#'BayEMQ-NoInit',
|
||||
#'BayEMQ-U-Temp*',
|
||||
# 'BayEMQ*2Temp1',
|
||||
# 'BayEMQ*2Temp*'
|
||||
|
||||
# 'BayEMQ-U-Temp1-2',
|
||||
# 'BayEMQ-T*',
|
||||
'BayEMQ',
|
||||
'BayEMQ*',
|
||||
# 'BootstrapACC',
|
||||
# 'BootstrapHDy',
|
||||
# 'BootstrapKDEy',
|
||||
|
|
@@ -111,8 +103,9 @@ def nicer(name:str):
|
|||
replacements = {
|
||||
'Bayesian': 'Ba',
|
||||
'Bootstrap': 'Bo',
|
||||
'numpyro': 'ro',
|
||||
'-numpyro': '',
|
||||
'emcee': 'emc',
|
||||
'-T*': '*'
|
||||
}
|
||||
for k, v in replacements.items():
|
||||
name = name.replace(k,v)
|
||||
|
|
@@ -121,14 +114,19 @@ def nicer(name:str):
|
|||
|
||||
base_dir = RESULT_DIR
|
||||
|
||||
for dataset_handler in [UCIMulticlassHandler]:
|
||||
table = defaultdict(list)
|
||||
n_classes = {}
|
||||
tr_size = {}
|
||||
tr_prev = {}
|
||||
|
||||
for dataset_handler in [UCIMulticlassHandler, LeQuaHandler, MNISTHandler]:
|
||||
problem_type = 'binary' if dataset_handler.is_binary() else 'multiclass'
|
||||
path = f'./{base_dir}/{problem_type}/*.pkl'
|
||||
table = defaultdict(list)
|
||||
|
||||
for file in tqdm(glob(path), desc='processing results', total=len(glob(path))):
|
||||
file = Path(file)
|
||||
dataset, method = file.name.replace('.pkl', '').split('__')
|
||||
if method not in methods:
|
||||
if (method not in methods) or (dataset not in dataset_handler.get_datasets()):
|
||||
continue
|
||||
|
||||
report = pickle.load(open(file, 'rb'))
|
||||
|
|
@@ -171,48 +169,40 @@ for dataset_handler in [UCIMulticlassHandler]:
|
|||
# [region_score(true_prev, ConfidenceEllipseILR(samples)) for true_prev, samples in zip(results['true-prevs'], results['samples'])]
|
||||
# )
|
||||
|
||||
|
||||
|
||||
df = pd.DataFrame(table)
|
||||
|
||||
n_classes = {}
|
||||
tr_size = {}
|
||||
tr_prev = {}
|
||||
for dataset in dataset_handler.iter():
|
||||
train = dataset.get_training()
|
||||
n_classes[dataset] = train.n_classes
|
||||
tr_size[dataset] = len(train)
|
||||
tr_prev[dataset] = F.strprev(train.prevalence())
|
||||
n_classes[dataset.name] = train.n_classes
|
||||
tr_size[dataset.name] = len(train)
|
||||
tr_prev[dataset.name] = F.strprev(train.prevalence())
|
||||
|
||||
# remove datasets with more than max_classes classes
|
||||
# max_classes = 25
|
||||
# min_train = 500
|
||||
# ignore_datasets = ['poker_hand', 'hcv']
|
||||
# for data_name, n in n_classes.items():
|
||||
# if n > max_classes:
|
||||
# df = df[df["dataset"] != data_name]
|
||||
# for data_name, n in tr_size.items():
|
||||
# if n < min_train:
|
||||
# df = df[df["dataset"] != data_name]
|
||||
# for data_name, n in tr_size.items():
|
||||
# if data_name in ignore_datasets:
|
||||
# df = df[df["dataset"] != data_name]
|
||||
# remove datasets with more than max_classes classes
|
||||
# max_classes = 25
|
||||
# min_train = 500
|
||||
# ignore_datasets = ['poker_hand', 'hcv']
|
||||
# for data_name, n in n_classes.items():
|
||||
# if n > max_classes:
|
||||
# df = df[df["dataset"] != data_name]
|
||||
# for data_name, n in tr_size.items():
|
||||
# if n < min_train:
|
||||
# df = df[df["dataset"] != data_name]
|
||||
# for data_name, n in tr_size.items():
|
||||
# if data_name in ignore_datasets:
|
||||
# df = df[df["dataset"] != data_name]
|
||||
|
||||
for region in ['CI']: #, 'CLR', 'ILR', 'CI']:
|
||||
if problem_type == 'binary' and region=='ILR':
|
||||
continue
|
||||
# pv = pd.pivot_table(
|
||||
# df, index='dataset', columns='method', values=['ae', f'c-{region}', f'a-{region}'], margins=True
|
||||
# )
|
||||
for column in [f'a-{region}', f'c-{region}', 'ae', 'SRE']:
|
||||
pv = pd.pivot_table(
|
||||
df, index='dataset', columns='method', values=column, margins=True
|
||||
)
|
||||
pv['n_classes'] = pv.index.map(n_classes).astype('Int64')
|
||||
pv['tr_size'] = pv.index.map(tr_size).astype('Int64')
|
||||
#pv['tr-prev'] = pv.index.map(tr_prev)
|
||||
pv = pv.drop(columns=[col for col in pv.columns if col[-1] == "All"])
|
||||
print(f'{problem_type=} {column=}')
|
||||
print(pv)
|
||||
print('-'*80)
|
||||
|
||||
df = pd.DataFrame(table)
|
||||
for region in ['CI']: #, 'CLR', 'ILR', 'CI']:
|
||||
if problem_type == 'binary' and region=='ILR':
|
||||
continue
|
||||
for column in [f'a-{region}', f'c-{region}', 'ae', 'SRE']:
|
||||
pv = pd.pivot_table(
|
||||
df, index='dataset', columns='method', values=column, margins=True
|
||||
)
|
||||
pv['n_classes'] = pv.index.map(n_classes).astype('Int64')
|
||||
pv['tr_size'] = pv.index.map(tr_size).astype('Int64')
|
||||
#pv['tr-prev'] = pv.index.map(tr_prev)
|
||||
pv = pv.drop(columns=[col for col in pv.columns if col[-1] == "All"])
|
||||
print(f'{problem_type=} {column=}')
|
||||
print(pv)
|
||||
print('-'*80)
|
||||
|
||||
|
|
|
|||
|
|
@@ -0,0 +1,134 @@
|
|||
import numpy as np
|
||||
from sklearn.linear_model import LogisticRegression, LogisticRegressionCV
|
||||
from sklearn.neighbors import KernelDensity
|
||||
from scipy.special import logsumexp
|
||||
from sklearn.model_selection import StratifiedKFold, cross_val_predict
|
||||
|
||||
|
||||
|
||||
def class_scale_factors(X, y):
|
||||
lambdas = {}
|
||||
scales = []
|
||||
for c in np.unique(y):
|
||||
Xc = X[y == c]
|
||||
cov = np.cov(Xc.T)
|
||||
scale = np.trace(cov)
|
||||
lambdas[c] = scale
|
||||
scales.append(scale)
|
||||
|
||||
mean_scale = np.mean(scales)
|
||||
for c in lambdas:
|
||||
lambdas[c] /= mean_scale
|
||||
|
||||
return lambdas
|
||||
|
||||
|
||||
class ClassConditionalKDE:
|
||||
def __init__(self, kernel="gaussian", lambdas=None):
|
||||
self.kernel = kernel
|
||||
self.lambdas = lambdas or {}
|
||||
self.models = {}
|
||||
|
||||
def fit(self, X, y, bandwidth):
|
||||
self.classes_ = np.unique(y)
|
||||
for c in self.classes_:
|
||||
h_c = bandwidth * self.lambdas.get(c, 1.0)
|
||||
kde = KernelDensity(kernel=self.kernel, bandwidth=h_c)
|
||||
kde.fit(X[y == c])
|
||||
self.models[c] = kde
|
||||
return self
|
||||
|
||||
def log_density(self, X):
|
||||
logp = np.column_stack([
|
||||
self.models[c].score_samples(X)
|
||||
for c in self.classes_
|
||||
])
|
||||
return logp
|
||||
|
||||
|
||||
|
||||
def conditional_log_likelihood(logp, y, priors=None):
|
||||
if priors is None:
|
||||
priors = np.ones(logp.shape[1]) / logp.shape[1]
|
||||
|
||||
log_prior = np.log(priors)
|
||||
log_joint = logp + log_prior
|
||||
|
||||
denom = logsumexp(log_joint, axis=1)
|
||||
num = log_joint[np.arange(len(y)), y]
|
||||
|
||||
return np.sum(num - denom)
|
||||
|
||||
|
||||
def cv_objective(
|
||||
bandwidth,
|
||||
X,
|
||||
y,
|
||||
lambdas,
|
||||
kernel="gaussian",
|
||||
n_splits=5,
|
||||
):
|
||||
skf = StratifiedKFold(n_splits=n_splits, shuffle=True, random_state=0)
|
||||
score = 0.0
|
||||
|
||||
for train, test in skf.split(X, y):
|
||||
model = ClassConditionalKDE(kernel=kernel, lambdas=lambdas)
|
||||
model.fit(X[train], y[train], bandwidth)
|
||||
|
||||
logp = model.log_density(X[test])
|
||||
score += conditional_log_likelihood(logp, y[test])
|
||||
|
||||
return score
|
||||
|
||||
|
||||
if __name__ == '__main__':
|
||||
|
||||
from BayesianKDEy.datasets import UCIMulticlassHandler
|
||||
from quapy.method.aggregative import KDEyML
|
||||
from quapy.model_selection import GridSearchQ
|
||||
from quapy.evaluation import evaluation_report
|
||||
|
||||
dataset = UCIMulticlassHandler('academic-success')
|
||||
training = dataset.get_training()
|
||||
X, y = training.Xy
|
||||
|
||||
cls = LogisticRegression()
|
||||
P = cross_val_predict(cls, X, y, cv=5, n_jobs=-1, method='predict_proba')
|
||||
|
||||
bandwidths = np.logspace(-3, 0, 50)
|
||||
lambdas=None
|
||||
|
||||
scores = [
|
||||
cv_objective(h, P, y, lambdas)
|
||||
for h in bandwidths
|
||||
]
|
||||
|
||||
best_h = bandwidths[np.argmax(scores)]
|
||||
print(best_h)
|
||||
|
||||
cls = LogisticRegression()
|
||||
kdey = KDEyML(cls, val_split=5, random_state=0)
|
||||
train, val_prot = dataset.get_train_valprot_for_modsel()
|
||||
modsel = GridSearchQ(kdey, param_grid={'bandwidth': bandwidths}, protocol=val_prot, n_jobs=-1, verbose=True)
|
||||
modsel.fit(*train.Xy)
|
||||
best_bandwidth = modsel.best_params_['bandwidth']
|
||||
print(best_bandwidth)
|
||||
|
||||
print(f'First experiment, with bandwidth={best_h:.4f}')
|
||||
cls = LogisticRegression()
|
||||
kdey=KDEyML(cls, val_split=5, random_state=0, bandwidth=best_h)
|
||||
train, test_prot = dataset.get_train_testprot_for_eval()
|
||||
kdey.fit(*train.Xy)
|
||||
report = evaluation_report(kdey, test_prot, error_metrics=['ae'])
|
||||
print(report.mean(numeric_only=True))
|
||||
|
||||
print(f'Second experiment, with bandwidth={best_bandwidth:.4f}')
|
||||
cls = LogisticRegression()
|
||||
kdey=KDEyML(cls, val_split=5, random_state=0, bandwidth=best_bandwidth)
|
||||
# train, test_prot = dataset.get_train_testprot_for_eval()
|
||||
kdey.fit(*train.Xy)
|
||||
report = evaluation_report(kdey, test_prot, error_metrics=['ae'])
|
||||
print(report.mean(numeric_only=True))
|
||||
|
||||
|
||||
|
||||
|
|
@@ -4,10 +4,11 @@ from pathlib import Path
|
|||
|
||||
import numpy as np
|
||||
import matplotlib.pyplot as plt
|
||||
from matplotlib.colors import ListedColormap
|
||||
from matplotlib.colors import ListedColormap, LinearSegmentedColormap
|
||||
from scipy.stats import gaussian_kde
|
||||
from sklearn.preprocessing import MinMaxScaler
|
||||
|
||||
from BayesianKDEy.commons import antagonistic_prevalence
|
||||
from BayesianKDEy.commons import antagonistic_prevalence, in_simplex
|
||||
from method.confidence import (ConfidenceIntervals as CI,
|
||||
ConfidenceEllipseSimplex as CE,
|
||||
ConfidenceEllipseCLR as CLR,
|
||||
|
|
@@ -269,19 +270,70 @@ def plot_points(ax, point_layers):
|
|||
**style
|
||||
)
|
||||
|
||||
def plot_density(
|
||||
ax,
|
||||
density_fn,
|
||||
resolution,
|
||||
densecolor="blue",
|
||||
alpha=1,
|
||||
high_contrast=True # maps the density values to [0,1] to enhance visualization with the cmap
|
||||
):
|
||||
xs = np.linspace(-0.2, 1.2, resolution)
|
||||
ys = np.linspace(-0.2, np.sqrt(3)/2 + 0.2, resolution)
|
||||
grid_x, grid_y = np.meshgrid(xs, ys)
|
||||
|
||||
white_to_color = LinearSegmentedColormap.from_list(
|
||||
"white_to_color",
|
||||
["white", densecolor]
|
||||
)
|
||||
|
||||
pts_bary = barycentric_from_xy(grid_x, grid_y)
|
||||
|
||||
density = np.zeros(grid_x.shape)
|
||||
flat_pts = pts_bary.reshape(-1, 3)
|
||||
|
||||
density_vals = np.array(density_fn(flat_pts))
|
||||
#density_vals = np.array([density_fn(p) for p in flat_pts])
|
||||
if high_contrast:
|
||||
min_v, max_v = np.min(density_vals), np.max(density_vals)
|
||||
density_vals = (density_vals - min_v)/(max_v-min_v)
|
||||
density[:] = density_vals.reshape(grid_x.shape)
|
||||
|
||||
|
||||
ax.pcolormesh(
|
||||
xs,
|
||||
ys,
|
||||
density,
|
||||
shading="auto",
|
||||
cmap=white_to_color,
|
||||
alpha=alpha,
|
||||
)
|
||||
|
||||
|
||||
def plot_simplex(
|
||||
point_layers=None,
|
||||
region_layers=None,
|
||||
region_resolution=1000,
|
||||
density_function=None,
|
||||
density_color="#1f77b4", # blue from tab10
|
||||
density_alpha=1,
|
||||
resolution=1000,
|
||||
confine_region_in_simplex=False,
|
||||
show_legend=True,
|
||||
save_path=None,
|
||||
):
|
||||
fig, ax = plt.subplots(figsize=(6, 6))
|
||||
|
||||
if density_function is not None:
|
||||
plot_density(
|
||||
ax,
|
||||
density_function,
|
||||
resolution,
|
||||
density_color,
|
||||
density_alpha,
|
||||
)
|
||||
|
||||
if region_layers:
|
||||
plot_regions(ax, region_layers, region_resolution, confine_region_in_simplex)
|
||||
plot_regions(ax, region_layers, resolution, confine_region_in_simplex)
|
||||
|
||||
if point_layers:
|
||||
plot_points(ax, point_layers)
|
||||
|
|
@@ -304,11 +356,80 @@ def plot_simplex(
|
|||
plt.tight_layout()
|
||||
if save_path:
|
||||
os.makedirs(Path(save_path).parent, exist_ok=True)
|
||||
plt.savefig(save_path)
|
||||
plt.savefig(save_path, bbox_inches="tight")
|
||||
else:
|
||||
plt.show()
|
||||
|
||||
|
||||
def gaussian_kernel(p, mu=np.array([0.6, 0.2, 0.2]), sigma=0.5):
|
||||
return np.exp(-np.sum((p - mu) ** 2) / (2 * sigma ** 2))
|
||||
|
||||
|
||||
def plot_kernels():
|
||||
from quapy.method._kdey import KDEBase
|
||||
|
||||
kernel = 'aitchison'
|
||||
|
||||
def kernel(p, center, bandwidth=0.1, kernel='gaussian', within_simplex=False):
|
||||
assert within_simplex or kernel == 'gaussian', f'cannot compute {kernel=} outside the simplex'
|
||||
X = np.asarray(center).reshape(-1, 3)
|
||||
p = np.asarray(p).reshape(-1, 3)
|
||||
KDE = KDEBase()
|
||||
kde = KDE.get_kde_function(X, bandwidth=bandwidth, kernel=kernel)
|
||||
|
||||
if within_simplex:
|
||||
density = np.zeros(shape=p.shape[0])
|
||||
p_mask = in_simplex(p)
|
||||
density_vals = KDE.pdf(kde, p[p_mask], kernel=kernel)
|
||||
density[p_mask] = density_vals
|
||||
else:
|
||||
density = KDE.pdf(kde, p, kernel=kernel)
|
||||
return density
|
||||
|
||||
plt.rcParams.update({
|
||||
'font.size': 15,
|
||||
'axes.titlesize': 12,
|
||||
'axes.labelsize': 10,
|
||||
'xtick.labelsize': 8,
|
||||
'ytick.labelsize': 8,
|
||||
'legend.fontsize': 9,
|
||||
})
|
||||
|
||||
dot_style = {"color": "red", "alpha": 1, "s": 100, 'linewidth': 1.5, 'edgecolors': "white"}
|
||||
# center = np.asarray([[0.05, 0.03, 0.92],[0.5, 0.4, 0.1]])
|
||||
center = np.asarray([0.33, 0.33, 0.34])
|
||||
point_layer = [
|
||||
{"points": center, "label": "kernels", "style": dot_style},
|
||||
]
|
||||
density_fn = lambda p: kernel(p, center, bandwidth=0.2, kernel='gaussian', within_simplex=False)
|
||||
plot_simplex(point_layers=point_layer, density_function=density_fn, show_legend=False,
|
||||
save_path='./plots/kernels/gaussian_center.png')
|
||||
|
||||
density_fn = lambda p: kernel(p, center, bandwidth=.6, kernel='aitchison', within_simplex=True)
|
||||
plot_simplex(point_layers=point_layer, density_function=density_fn, show_legend=False,
|
||||
save_path='./plots/kernels/aitchison_center.png')
|
||||
|
||||
center = np.asarray([0.05, 0.05, 0.9])
|
||||
point_layer[0]['points'] = center
|
||||
density_fn = lambda p: kernel(p, center, bandwidth=0.2, kernel='gaussian', within_simplex=False)
|
||||
plot_simplex(point_layers=point_layer, density_function=density_fn, show_legend=False,
|
||||
save_path='./plots/kernels/gaussian_vertex_005_005_09.png')
|
||||
|
||||
density_fn = lambda p: kernel(p, center, bandwidth=1, kernel='aitchison', within_simplex=True)
|
||||
plot_simplex(point_layers=point_layer, density_function=density_fn, show_legend=False,
|
||||
save_path='./plots/kernels/aitchison_vertex_005_005_09.png')
|
||||
|
||||
center = np.asarray([0.45, 0.45, 0.1])
|
||||
point_layer[0]['points'] = center
|
||||
density_fn = lambda p: kernel(p, center, bandwidth=0.2, kernel='gaussian', within_simplex=False)
|
||||
plot_simplex(point_layers=point_layer, density_function=density_fn, show_legend=False,
|
||||
save_path='./plots/kernels/gaussian_border_045_045_01.png')
|
||||
|
||||
density_fn = lambda p: kernel(p, center, bandwidth=.7, kernel='aitchison', within_simplex=True)
|
||||
plot_simplex(point_layers=point_layer, density_function=density_fn, show_legend=False,
|
||||
save_path='./plots/kernels/aitchison_border_045_045_01.png')
|
||||
|
||||
|
||||
if __name__ == '__main__':
|
||||
np.random.seed(1)
|
||||
|
||||
|
|
@@ -370,6 +491,7 @@ if __name__ == '__main__':
|
|||
train_style = {"color": "blue", "alpha": 0.5, "s":15, 'linewidth':0.5, 'edgecolors':None}
|
||||
test_style = {"color": "red", "alpha": 0.5, "s": 15, 'linewidth': 0.5, 'edgecolors': None}
|
||||
|
||||
|
||||
# train_prevs = np.random.dirichlet(alpha=[1, 1, 1], size=n)
|
||||
# test_prevs = np.random.dirichlet(alpha=[1, 1, 1], size=n)
|
||||
# plot_simplex(
|
||||
|
|
@@ -401,23 +523,25 @@ if __name__ == '__main__':
|
|||
# save_path=f'./plots/prior_test/wrong.png'
|
||||
# )
|
||||
|
||||
p = 0.6
|
||||
# p = 0.6
|
||||
#
|
||||
# K = 3
|
||||
# # alpha = [p] + [(1. - p) / (K - 1)] * (K - 1)
|
||||
# alpha = [0.095, 0.246, 0.658] # connect-4
|
||||
# alpha = np.array(alpha)
|
||||
#
|
||||
#
|
||||
# for c in [50, 500, 5_000]:
|
||||
# alpha_tr = alpha * c
|
||||
# alpha_te = antagonistic_prevalence(alpha, strength=1) * c
|
||||
# train_prevs = np.random.dirichlet(alpha=alpha_tr, size=n)
|
||||
# test_prevs = np.random.dirichlet(alpha=alpha_te, size=n)
|
||||
# plot_simplex(
|
||||
# point_layers=[
|
||||
# {"points": train_prevs, "label": "train", "style": train_style},
|
||||
# {"points": test_prevs, "label": "test", "style": test_style},
|
||||
# ],
|
||||
# save_path=f'./plots/prior_test/concentration_{c}.png'
|
||||
# )
|
||||
|
||||
K = 3
|
||||
# alpha = [p] + [(1. - p) / (K - 1)] * (K - 1)
|
||||
alpha = [0.095, 0.246, 0.658] # connect-4
|
||||
alpha = np.array(alpha)
|
||||
|
||||
|
||||
for c in [50, 500, 5_000]:
|
||||
alpha_tr = alpha * c
|
||||
alpha_te = antagonistic_prevalence(alpha, strength=1) * c
|
||||
train_prevs = np.random.dirichlet(alpha=alpha_tr, size=n)
|
||||
test_prevs = np.random.dirichlet(alpha=alpha_te, size=n)
|
||||
plot_simplex(
|
||||
point_layers=[
|
||||
{"points": train_prevs, "label": "train", "style": train_style},
|
||||
{"points": test_prevs, "label": "test", "style": test_style},
|
||||
],
|
||||
save_path=f'./plots/prior_test/concentration_{c}.png'
|
||||
)
|
||||
plot_kernels()
|
||||
|
|
@@ -27,22 +27,28 @@ def temp_calibration(method:WithConfidenceABC,
|
|||
if isinstance(amplitude_threshold, float) and amplitude_threshold > 0.1:
|
||||
print(f'warning: the {amplitude_threshold=} is too large; this may lead to uninformative regions')
|
||||
|
||||
def evaluate_temperature_job(temp):
|
||||
def evaluate_temperature_job(job_id, temp):
|
||||
if verbose:
|
||||
print(f'\tstarting exploration with temperature={temp}...')
|
||||
|
||||
local_method = copy.deepcopy(method)
|
||||
local_method.temperature = temp
|
||||
|
||||
coverage = 0
|
||||
amplitudes = []
|
||||
errs = []
|
||||
# errs = []
|
||||
|
||||
for i, (sample, prev) in enumerate(val_prot()):
|
||||
pbar = tqdm(enumerate(val_prot()), position=job_id, total=val_prot.total(), disable=not verbose)
|
||||
|
||||
for i, (sample, prev) in pbar:
|
||||
point_estim, conf_region = local_method.predict_conf(sample)
|
||||
|
||||
if prev in conf_region:
|
||||
coverage += 1
|
||||
|
||||
amplitudes.append(conf_region.montecarlo_proportion(n_trials=50_000))
|
||||
errs.append(qp.error.mae(prev, point_estim))
|
||||
# errs.append(qp.error.mae(prev, point_estim))
|
||||
pbar.set_description(f'job={job_id} T={temp}: coverage={coverage/(i+1)*100:.2f}% amplitude={np.mean(amplitudes)*100:.2f}%')
|
||||
|
||||
mean_coverage = coverage / val_prot.total()
|
||||
mean_amplitude = np.mean(amplitudes)
|
||||
|
|
@@ -56,8 +62,8 @@ def temp_calibration(method:WithConfidenceABC,
|
|||
method.fit(*train.Xy)
|
||||
|
||||
raw_results = Parallel(n_jobs=n_jobs, backend="loky")(
|
||||
delayed(evaluate_temperature_job)(temp)
|
||||
for temp in tqdm(temp_grid, disable=not verbose)
|
||||
delayed(evaluate_temperature_job)(job_id, temp)
|
||||
for job_id, temp in tqdm(enumerate(temp_grid), disable=not verbose)
|
||||
)
|
||||
results = [
|
||||
(temp, cov, amp)
|
||||
|
|
|
|||
|
|
@@ -99,6 +99,9 @@ class SamplesFromDir(AbstractProtocol):
|
|||
sample, _ = self.load_fn(os.path.join(self.path_dir, f'{id}.txt'))
|
||||
yield sample, prevalence
|
||||
|
||||
def total(self):
|
||||
return len(self.true_prevs)
|
||||
|
||||
|
||||
class LabelledCollectionsFromDir(AbstractProtocol):
|
||||
|
||||
|
|
@@ -113,6 +116,9 @@ class LabelledCollectionsFromDir(AbstractProtocol):
|
|||
lc = LabelledCollection.load(path=collection_path, loader_func=self.load_fn)
|
||||
yield lc
|
||||
|
||||
def total(self):
|
||||
return len(self.true_prevs)
|
||||
|
||||
|
||||
class ResultSubmission:
|
||||
|
||||
|
|
|
|||