Source code for pymint.main.interpret_toolkit

import numpy as np
import xarray as xr
import pandas as pd
import itertools

# Computation imports
from ..common.attributes import Attributes
from .local_interpret import LocalInterpret
from .global_interpret import GlobalInterpret

# Plotting imports
from ..plot.plot_interpret_curves import PlotInterpretCurves
from ..plot.plot_permutation_importance import PlotImportance
from ..plot.plot_feature_contributions import PlotFeatureContributions
from ..plot.plot_2D import PlotInterpret2D
from ..plot._box_and_whisker import box_and_whisker
from ..plot._kde_2d import PlotScatter

from ..common.utils import (
    to_xarray,
    get_indices_based_on_performance,
    retrieve_important_vars,
    load_netcdf,
    load_dataframe,
    save_netcdf,
    save_dataframe,
    combine_top_features,
    determine_feature_dtype,
    is_str,
    is_list,
    is_dataset,
    is_dataframe,
    compute_importance
    )

[docs]class InterpretToolkit(Attributes):

    """
    
    InterpretToolkit is the primary interface of PyMint. The modules contained within compute several
    interpretable machine learning (IML) methods such as 
    
    Feature importance: 
        
        * `permutation_importance`
        * `ale_variance`
        
    Feature Attributions:
        
        - `ale`
        - `pd`
        - `ice`
        - `shap`
        - `local_contributions`
        
    Feature Interactions:
    
        - `interaction_strength`
        - `ale_variance`
        - `perm_based_interaction`
        - `friedman_h_stat`
        - `main_effect_complexity`
        - `ale`
        - `pd`
    
    Additionally, there are corresponding plotting modules for 
    each IML method, which are designed to produce publication-quality graphics. 
    
    .. note:: 
        InterpretToolkit is designed to work with estimators that implement predict or predict_proba. 
        
    .. caution::
        InterpretToolkit is only designed to work with binary classification and regression problems. 
        In future versions of PyMint, we hope to be compatiable with multi-class classification. 
    
    
    Parameters
    -----------
    
    estimators : list of tuples of (estimator name, fitted estimator)
        Tuple of (estimator name, fitted estimator object) or list thereof where the 
        fitted estimator must implement ``predict`` or ``predict_proba``.
        Multioutput-multiclass classifiers are not supported.

    X : {array-like or dataframe} of shape (n_samples, n_features)
        Training or validation data used to compute the IML methods.
        If ndnumpy.array, must specify `feature_names`.

    y : {list or numpy.array} of shape (n_samples,)
        The target values (class labels in classification, real numbers in regression).

    estimator_output : ``"raw"`` or ``"probability"``
        What output of the estimator should be explained. Determined internally by
        InterpretToolkit. However, if using a classification model, the user
        can set to "raw" for non-probabilistic output. 

    feature_names : array-like of shape (n_features,), dtype=str, default=None
        Name of each feature; ``feature_names[i]`` holds the name of the feature
        with index ``i``. By default, the name of the feature corresponds to their numerical
        index for NumPy array and their column name for pandas dataframe. 
        Feature names are only required if ``X`` is an ndnumpy.array, a it will be 
        converted to a pandas.DataFrame internally. 
    
    Raises
    ---------
    AssertError
        Number of estimator objects is not equal to the number of estimator names given!
    TypeError
        y variable must be numpy array or pandas.DataFrame.
    Exception
        Feature names must be specified if X is an numpy.array.
    ValueError
        estimator_output is not an accepted option.
    
    """

    def __init__(self, estimators=None, 
                 X=pd.DataFrame(np.array([])), 
                 y=np.array([]),
                 estimator_output=None,
                 feature_names=None):

        if estimators is not None:
            if not is_list(estimators) and estimators:
                estimators = [estimators]
            estimator_names = [e[0] for e in estimators]
            estimators = [e[1] for e in estimators]
        else:
            estimator_names = None 

        self.set_estimator_attribute(estimators, estimator_names)
        self.set_y_attribute(y)
        self.set_X_attribute(X, feature_names)
        self.set_estimator_output(estimator_output, estimators)
        self.checked_attributes = True

        # Initialize a global interpret object
        self.global_obj = GlobalInterpret(estimators=self.estimators,
                                      estimator_names=self.estimator_names,
                                      X=self.X,
                                      y =self.y,
                                      estimator_output=self.estimator_output,
                                     checked_attributes=self.checked_attributes)

        # Initialize a local interpret object
        self.local_obj = LocalInterpret(estimators=self.estimators,
                            estimator_names=self.estimator_names,
                            X=self.X,
                            y=self.y,
                            estimator_output=self.estimator_output,
                            checked_attributes=self.checked_attributes
                            )
        
        self.attrs_dict = {
                      'estimator_output' : self.estimator_output,
                      'estimators used' : self.estimator_names
                     }

    def __repr__(self):
        return 'InterpretToolkit(estimator=%s \n \
                                 estimator_names=%s \n \
                                 X=%s length:%d \n \
                                 y=%s length:%d \n \
                                 estimator_output=%s \n \
                                 feature_names=%s length %d)' % \
                                 (self.estimators,
                                 self.estimator_names,
                                 type(self.X), len(self.X),
                                 type(self.y), len(self.y),
                                 self.estimator_output,
                                 type(self.feature_names), len(self.feature_names))

    def _append_attributes(self,ds):
        """
        FOR INTERNAL PURPOSES ONLY.
        
        Append attributes to a xarray.Dataset or pandas.DataFrame

        Parameters
        ----------
        
        ds : xarray.Dataset or pandas.DataFrame
            Results data from the IML methods 
        
        """

        for key in self.attrs_dict.keys():
            ds.attrs[key] = self.attrs_dict[key]
            
        return ds
    
[docs]    def permutation_importance(self, n_vars, evaluation_fn, direction='backward',
            subsample=1.0, n_jobs=1, n_permute=1, scoring_strategy=None, verbose=False, 
             return_iterations=False, random_seed=1,                
                              ):
        """
        Performs single-pass and/or multi-pass permutation importance using a modified version of the
        PermutationImportance package (pymint.PermutationImportance) [1]_. The single-pass approach was first 
        developed in Brieman (2001) [2]_ and then improved upon in Lakshmanan et al. (2015) [3]_. 
         
        .. attention :: 
                The permutation importance rankings can be sensitive to the evaluation function used. 
                Consider re-computing with multiple evaluation functions. 
                
        .. attention :: 
                The permutation importance rankings can be sensitive to the direction used. 
                Consider re-computing with both forward- and backward-based methods.         
        
        .. hint :: 
            Since the permutation importance is a marginal-based method, you can often use 
            subsample << 1.0 without substantially altering the feature rankings. 
            Using a subsample << 1.0 can reduce the computation time for larger datasets (e.g., >100 K X), 
            especially since 100-1000s of bootstrap iterations are often required for reliable rankings. 

        Parameters
        ----------
        
        n_vars : integer
            number of variables to calculate the multipass permutation importance for. If ``n_vars=1``, then 
            only the single-pass permutation importance is computed. If ``n_vars>1``, both the single-pass 
            and multiple-pass are computed. 
        
        evaluation_fn : string or callable 
            evaluation/scoring function for evaluating the loss of skill once a feature is permuted. 
            evaluation_fn can be set to one of the following strings:
            
                - ``"auc"``, Area under the Curve
                - ``"auprc"``, Area under the Precision-Recall Curve
                - ``"bss"``, Brier Skill Score
                - ``"mse"``, Mean Square Error
                - ``"norm_aupdc"``,  Normalized Area under the Performance Diagram (Precision-Recall) Curve
                
            Otherwise, evaluation_fn can be any function of form, 
            `evaluation_fn(targets, predictions)` and must return a scalar value
            
            When using a custom function, you must also set the scoring strategy (see below).
        
        scoring_strategy : string (default=None)
        
            This argument is only required if you are using a non-default evaluation_fn (see above)
        
            If the evaluation_fn is positively-oriented (a higher value is better), 
            then set ``scoring_strategy = "argmin_of_mean"`` and if it is negatively-oriented-
            (a lower value is better), then set ``scoring_strategy = "argmax_of_mean"``
            
        direction : ``"forward"`` or ``"backward"``
        
            For the multi-pass method. For ``"backward"``, the top feature is left permuted before determining
            the second-most important feature (and so on). For ``"forward"``, all features are permuted
            and then the top features are progressively left unpermuted. For real-world datasets, the two
            methods often do not produce the same feature rankings and is worth exploring both. 
      
        subsample: float or integer (default=1.0 for no subsampling)
        
            if value is between 0-1, it is interpreted as fraction of total X to use 
            if value > 1, interpreted as the number of X to randomly sample 
            from the original dataset.
        
        n_jobs : interger or float (default=1; no multiprocessing)
        
            if integer, interpreted as the number of processors to use for multiprocessing
            if float between 0-1, interpreted as the fraction of proceesors to use for multiprocessing
        
        n_permute: integer (default=1 for only one permutation per feature)
            Number of permutations for computing confidence intervals on the feature rankings. 
            
        random_seed : int, RandomState instance, default=None
        
            Pseudo-random number generator to control the permutations of each
            feature. Pass an int to get reproducible results across function calls.
        
        verbose : boolean
            True for print statements on the progress
        
        Returns
        --------
        results : xarray.DataSet 
            Permutation importance results. Includes the both multi-pass and single-pass 
            feature rankings and the scores with the various features permuted. 
        
        References 
        -----------
        .. [1] https://github.com/gelijergensen/PermutationImportance
        
        .. [2] L. Breiman, "Random Forests", Machine Learning, 45(1), 5-32, 2001.
        
        .. [3] Lakshmanan, V., C. Karstens, J. Krause, K. Elmore, A. Ryzhkov, and S. Berkseth, 2015: 
               Which Polarimetric Variables Are Important for Weather/No-Weather Discrimination? 
               Journal of Atmospheric and Oceanic Technology, 32, 1209–1223, 
               https://doi.org/10.1175/jtech-d-13-00205.1.
        
        Examples
        ----------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> # Only compute for the first model
        >>> explainer = pymint.InterpretToolkit(estimators=estimators[0],
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> perm_imp_results = explainer.permutation_importance( 
        ...                       n_vars=10,
        ...                       evaluation_fn = 'norm_aupdc',
        ...                       subsample=0.5,
        ...                       n_permute=20, 
        ...                       )
        >>> print(perm_imp_results)
        <xarray.Dataset>
            Dimensions:           (n_permute: 20, n_vars_multipass: 10, n_vars_singlepass: 30)
            Dimensions without coordinates: n_permute, n_vars_multipass, n_vars_singlepass
            Data variables:
                multipass_rankings__Random Forest   (n_vars_multipass) <U17 'sfc_te...
                multipass_scores__Random Forest     (n_vars_multipass, n_permute) float64 ...
                singlepass_rankings__Random Forest  (n_vars_singlepass) <U17 'sfc_t...
                singlepass_scores__Random Forest    (n_vars_singlepass, n_permute) float64 ...
                original_score__Random Forest       (n_permute) float64 0.9851 .....
            Attributes:
                estimator_output:  probability
                estimators used:   ['Random Forest']
                n_multipass_vars:  10
                method:            permutation_importance
                direction:         backward
                evaluation_fn:     norm_aupdc
        """
        results_ds, orientation = self.global_obj.calc_permutation_importance(n_vars=n_vars,
                                                    evaluation_fn=evaluation_fn,
                                                    subsample=subsample,
                                                    n_jobs=n_jobs,
                                                    n_permute=n_permute,
                                                    scoring_strategy=scoring_strategy,
                                                    verbose=verbose,
                                                    direction=direction,
                                                    return_iterations=return_iterations,
                                                    random_seed=random_seed,
                                                   )

        self.attrs_dict['n_multipass_vars'] = n_vars
        self.attrs_dict['method'] = 'permutation_importance'
        self.attrs_dict['direction'] = direction
        self.attrs_dict['evaluation_fn'] = evaluation_fn
        results_ds = self._append_attributes(results_ds)
    
        # Convert the permutation scores to proper importance scores. 
        results_ds = compute_importance(results_ds, orientation)
        
        return results_ds

    
[docs]    def grouped_permutation_importance(self, perm_method, 
                                       evaluation_fn, n_permute=1, groups=None,
                                      sample_size=100, subsample=1.0, n_jobs=1, 
                                      clustering_kwargs={'n_clusters' : 10}):
        """
        The group only permutation feature importance (GOPFI) from Au et al. 2021 [1]_
        (see their equations 10 and 11). This function has a built-in method for clustering 
        features using the sklearn.cluster.FeatureAgglomeration. It also has the ability to 
        compute the results over multiple permutations to improve the feature importance 
        estimate (and provide uncertainty). 
    
        Original score = Jointly permute all features 
        Permuted score = Jointly permuting all features except the considered group
    
        Loss metrics := Original_score - Permuted Score 
        Skill Score metrics := Permuted score - Original Score 
    
    
        Parameters
        ----------------
        
        perm_method : ``"grouped"`` or ``"grouped_only"``
        
            If ``"grouped"``, the features within a group are jointly permuted and other features 
            are left unpermuted. 
            
            If ``"grouped_only"``, only the features within a group are left unpermuted and 
            other features are jointly permuted. 

        
        evaluation_fn : string or callable 
            evaluation/scoring function for evaluating the loss of skill once a feature is permuted. 
            evaluation_fn can be set to one of the following strings:
            
                - ``"auc"``, Area under the Curve
                - ``"auprc"``, Area under the Precision-Recall Curve
                - ``"bss"``, Brier Skill Score
                - ``"mse"``, Mean Square Error
                - ``"norm_aupdc"``,  Normalized Area under the Performance Diagram (Precision-Recall) Curve
                
            Otherwise, evaluation_fn can be any function of form, 
            `evaluation_fn(targets, predictions)` and must return a scalar value
            
            When using a custom function, you must also set the scoring strategy (see below).
   
        n_permute: integer (default=1 for only one permutation per feature)
                Number of permutations for computing confidence intervals on the feature rankings.
    
        groups : dict (default=None)
                Dictionary of group names and the feature names or feature column indices. 
                If None, then the feature groupings are determined internally based on 
                feature clusterings. 
            
        sample_size : integer (default=100)
                Number of random samples to determine the correlation for the feature clusterings
            
        subsample: float or integer (default=1.0 for no subsampling)
        
                if value is between 0-1, it is interpreted as fraction of total X to use 
                if value > 1, interpreted as the number of X to randomly sample 
                from the original dataset. 
        
        n_jobs : interger or float (default=1; no multiprocessing)
        
            if integer, interpreted as the number of processors to use for multiprocessing
            if float between 0-1, interpreted as the fraction of proceesors to use for multiprocessing
        
        clustering_kwargs : dict (default = {'n_clusters' : 10})
            See https://scikit-learn.org/stable/modules/generated/sklearn.cluster.FeatureAgglomeration.html 
            for details 
               
        Returns
        ----------------
    
        results : xarray.DataSet 
            Permutation importance results. Includes the both multi-pass and single-pass 
            feature rankings and the scores with the various features permuted. 
    
        groups : dict
            If groups is None, then it returns the groups that were 
            automatically created in the feature clustering. Otherwise, 
            only results is returned. 
    
        References 
        -----------
        .. [1] Au, Q., J. Herbinger, C. Stachl, B. Bischl, and G. Casalicchio, 2021: 
        Grouped Feature Importance and Combined Features Effect Plot. Arxiv,.
    
        Examples
        ----------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> # Only compute for the first model
        >>> explainer = pymint.InterpretToolkit(estimators=estimators[0],
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> # Group only, the features within a group are the only one's left unpermuted 
        >>> results, groups = explainer.grouped_permutation_importance( 
        ...                                          perm_method = 'grouped_only',
        ...                                          evaluation_fn = 'norm_aupdc',)
        >>> print(results)
        <xarray.Dataset>
            Dimensions:                        (n_vars_group: 10, n_bootstrap: 1)
            Dimensions without coordinates: n_vars_group, n_bootstrap
            Data variables:
                group_rankings__Random Forest  (n_vars_group) <U7 'group 3' ... 'group 4'
                group_scores__Random Forest    (n_vars_group, n_bootstrap) float64 0.4822...
            Attributes:
                estimators used:   ['Random Forest']
                estimator output:  probability
                estimator_output:  probability
                groups:            {'group 0': array(['d_rad_d', 'd_rad_u'], dtype=object...
                method:            grouped_permutation_importance
                perm_method:       grouped_only
                evaluation_fn:     norm_aupdc
        >>> print(groups)
        {'group 0': array(['d_rad_d', 'd_rad_u'], dtype=object), 
        'group 1': array(['high_cloud', 'lat_hf', 'mid_cloud', 'sfcT_hrs_ab_frez', 'date_marker'], dtype=object),
        'group 2': array(['dllwave_flux', 'uplwav_flux'], dtype=object),
        'group 3': array(['dwpt2m', 'fric_vel', 'sat_irbt', 'sfc_rough', 'sfc_temp',
       'temp2m', 'wind10m', 'urban', 'rural', 'hrrr_dT'], dtype=object), 
       'group 4': array(['low_cloud', 'tot_cloud', 'vbd_flux', 'vdd_flux'], dtype=object), 
       'group 5': array(['gflux', 'd_ground'], dtype=object), 
       'group 6': array(['sfcT_hrs_bl_frez', 'tmp2m_hrs_bl_frez'], dtype=object), 
       'group 7': array(['swave_flux'], dtype=object), 
       'group 8': array(['sens_hf'], dtype=object), 
       'group 9': array(['tmp2m_hrs_ab_frez'], dtype=object)
       }
        """
        return_names=False
        if groups is None:
            return_names=True
        
        results_ds, groups = self.global_obj.grouped_feature_importance(
                                   evaluation_fn=evaluation_fn, 
                                   perm_method=perm_method,
                               n_permute=n_permute, 
                               groups=groups, 
                               sample_size=sample_size, 
                               subsample=subsample, 
                               clustering_kwargs=clustering_kwargs,
                               n_jobs=n_jobs)

        
        for k,v in groups.items():
            self.attrs_dict[k] =list(v)
            
        self.attrs_dict['method'] = 'grouped_permutation_importance'
        self.attrs_dict['perm_method'] = perm_method
        self.attrs_dict['evaluation_fn'] = evaluation_fn
        results_ds = self._append_attributes(results_ds)
        
        if return_names:
            return results_ds, groups 
        else:
            return results_ds

[docs]    def ale_variance(self, 
                     ale,
                     features=None, 
                          estimator_names=None,
                          interaction=False, 
                         ):
        """
        Compute the standard deviation (std) of the ALE values for each 
        features in a dataset and then rank by the magnitude. A higher std(ALE) indicates a 
        greater expected contribution to an estimator's prediction and is thus considered more important. 
        If ``interaction=True``, then the method computes a similar method for the 
        2D ALE to measure the feature interaction strength. 
        
        This method is inspired by the feature importance and interaction 
        methods developed in Greenwell et al. (2018) [4]_.
        
        Parameters
        ----------
        
        ale : xarray.Dataset
            
            Results of :func:`~InterpretToolkit.ale` for
            ``features``.
            
        features : 'all', string, list of strings, list of 2-tuples
            
            Features to compute the ALE variance for. If set to ``'all'``, it is 
            computed for all features. If ``interaction=True``, then features
            must be a list of 2-tuples for computing the interaction between
            the set of feature combinations. 
            
        estimator_names : string, list of strings
        
            If using multiple estimators, you can pass a single (or subset of) estimator name(s) 
            to compute the ALE variance for. 
        
        interaction : boolean 
        
            - If True, it computes the feature interaction strength
            - If False, compute the feature importance 

        Returns
        --------
        
        results_ds : xarray.Dataset
            ALE variance results. Includes both the rankings and scores. 
        
        References
        -------------
        
        .. [4] Greenwell, B. M., B. C. Boehmke, and A. J. McCarthy, 2018: 
               A Simple and Effective estimator-Based Variable Importance Measure. Arxiv,.
        
        
        Examples
        -----------
        >>> import pymint
        >>> import itertools
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators,
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> ale = explainer.ale(features='all', n_bins=10, subsample=1000, n_bootstrap=1)
        >>> # Compute 1D ALE variance
        >>> ale_var_results = explainer.ale_variance(ale)
        >>> print(ale_var_results)
        <xarray.Dataset>
        Dimensions:    (n_bootstrap: 1, n_vars_ale_variance: 30)
        Dimensions without coordinates: n_bootstrap, n_vars_ale_variance
        Data variables:
            ale_variance_rankings__Random Forest        (n_vars_ale_variance) <U17 'r...
            ale_variance_scores__Random Forest          (n_vars_ale_variance, n_bootstrap) float64 ...
            ale_variance_rankings__Gradient Boosting    (n_vars_ale_variance) <U17 'u...
            ale_variance_scores__Gradient Boosting      (n_vars_ale_variance, n_bootstrap) float64 ...
            ale_variance_rankings__Logistic Regression  (n_vars_ale_variance) <U17 'r...
            ale_variance_scores__Logistic Regression    (n_vars_ale_variance, n_bootstrap) float64 ...
        Attribute:
            estimator_output:  probability
            estimators used:   ['Random Forest', 'Gradient Boosting', 'Logistic Regre...
            n_multipass_vars:  5
            method:            ale_variance
            direction:         backward
            evaluation_fn:     sigma_ale
            dimension:         1D
            features used:     ['dllwave_flux', 'dwpt2m', 'fric_vel', 'gflux', 'high_...
            estimator output:  probability
            interaction:       False
        
        >>> #Typical, we only want to evaluate the feature interactions for
        >>> # the most important features
        >>> important_vars = ['sfc_temp', 'temp2m', 'sfcT_hrs_bl_frez', 'tmp2m_hrs_bl_frez',
        ...   'uplwav_flux']
        >>> # Create all possible combinations
        >>> important_vars_2d = list(itertools.combinations(important_vars, r=2))
        >>> #For the 2D ALE variance to measure feature interaction strength
        >>> ale_2d = explainer.ale(features=important_vars_2d, n_bins=10, 
        ...              subsample=1000, n_bootstrap=1)
        >>> # Compute 2D ALE variance 
        >>> ale_var_results = explainer.ale_variance(ale_2d, features=important_vars_2d, 
        ...                    interaction=True)
        >>> print(ale_var_results)
        <xarray.Dataset>
        Dimensions:   (n_bootstrap: 1, n_vars_ale_variance_interactions: 10)
        Dimensions without coordinates: n_bootstrap, n_vars_ale_variance_interactions
        Data variables:
            ale_variance_interactions_rankings__Random Forest        (n_vars_ale_variance_interactions) <U35 ...
            ale_variance_interactions_scores__Random Forest          (n_vars_ale_variance_interactions, n_bootstrap) float64 ...
            ale_variance_interactions_rankings__Gradient Boosting    (n_vars_ale_variance_interactions) <U35 ...
            ale_variance_interactions_scores__Gradient Boosting      (n_vars_ale_variance_interactions, n_bootstrap) float64 ...
            ale_variance_interactions_rankings__Logistic Regression  (n_vars_ale_variance_interactions) <U35 ...
            ale_variance_interactions_scores__Logistic Regression    (n_vars_ale_variance_interactions, n_bootstrap) float64 ...
        Attribute:
            estimator_output:  probability
            estimators used:   ['Random Forest', 'Gradient Boosting', 'Logistic Regre...
            n_multipass_vars:  5
            method:            ale_variance
            direction:         backward
            evaluation_fn:     Interaction Importance
            dimension:         2D
            features used:     [('sfc_temp', 'temp2m'), ('sfc_temp', 'sfcT_hrs_bl_fre...
            estimator output:  probability
            interaction:       True
        """
        if (features == 'all' or features is None) and interaction:
            features = list(itertools.combinations(self.feature_names, r=2))
        
        if estimator_names is None:
            estimator_names = self.estimator_names
        
        if is_str(estimator_names):
            estimator_names = [estimator_names]
        
        if interaction:
            if ale.attrs['dimension'] != '2D':
                raise Expection("ale must be compute for second-order ALE if interaction == True")
                    
        # Check that ale_data is an xarray.Dataset
        if not isinstance(ale, xr.core.dataset.Dataset):
            raise ValueError("""
                                 ale must be an xarray.Dataset, 
                                 perferably generated by InterpretToolkit.ale 
                                 to be formatted correctly
                                 """)
        else:
            any_missing = all([m in ale.attrs['estimators used'] for m in estimator_names])
            if not any_missing:
                raise ValueError('ale does not contain values for all the estimator names given!')
                
        if interaction:
            func = self.global_obj.compute_interaction_rankings
        else:
            func = self.global_obj.compute_ale_variance
        
        results_ds = func(data=ale, estimator_names=estimator_names, features=features,)
            
        self.attrs_dict['method'] = 'ale_variance'
        self.attrs_dict['estimators used'] = estimator_names
        self.attrs_dict['estimator output'] = 'probability'
        self.attrs_dict['interaction'] = str(interaction)
        if interaction:
            self.attrs_dict['evaluation_fn'] = 'Interaction Importance'
        else:
            self.attrs_dict['evaluation_fn'] =  'sigma_ale' #'$\sigma$(ALE)'
        
        results_ds = self._append_attributes(results_ds)
        
        return results_ds

    
[docs]    def main_effect_complexity(self, ale, estimator_names=None, 
                                    max_segments=10, approx_error=0.05):
        """
        Compute the Main Effect Complexity (MEC; Molnar et al. 2019) [5]_. 
        MEC is the number of linear segements required to approximate 
        the first-order ALE curves averaged over all features. 
        The MEC is weighted-averged by the variance. Higher values indicate
        a more complex estimator (less interpretable). 
        
        References 
        -----------
        .. [5] Molnar, C., G. Casalicchio, and B. Bischl, 2019: Quantifying estimator Complexity via 
            Functional Decomposition for Better Post-Hoc Interpretability. ArXiv.
        
        
        Parameters
        ----------------
        
        ale : xarray.Dataset
            
             Results of :func:`~InterpretToolkit.ale`. Must be computed for all features in X. 

        estimator_names : string, list of strings
        
            If using multiple estimators, you can pass a single (or subset of) estimator name(s) 
            to compute the MEC for. 
            
        max_segments : integer; default=10
            
            Maximum number of linear segments used to approximate the main/first-order 
            effect of a feature. default is 10. Used to limit the computational runtime. 
            
        approx_error : float; default=0.05
        
            The accepted error of the R squared between the piece-wise linear function 
            and the true ALE curve. If the R square is within the approx_error, then 
            no additional segments are added.
            
         
        Returns
        ---------
            mec_dict : dictionary 
                mec_dict = {estimator_name0 : mec0, estimator_name1 : mec2, ..., estimator_nameN : mecN,}
                
                
        Examples
        ---------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators,
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> ale = explainer.ale(features='all', n_bins=20, subsample=0.5, n_bootstrap=20)
        >>> # Compute Main Effect Complexity (MEC)
        >>> mec_ds = explainer.main_effect_complexity(ale)
        >>> print(mes_ds)
        {'Random Forest': 2.6792782503392756,
         'Gradient Boosting': 2.692392706080586,
         'Logistic Regression': 1.6338281469152958}
        """
        if estimator_names is None:
            estimator_names=self.estimator_names
        else:
            if is_str(estimator_names):
                estimator_names=[estimator_names]
        
        mec_dict = {}
        for estimator_name in estimator_names:
            mec, _ = self.global_obj.compute_main_effect_complexity( 
                        estimator_name=estimator_name, 
                        ale_ds=ale,  
                        features=self.feature_names, 
                        max_segments=max_segments, 
                        approx_error=approx_error
            )
            
            mec_dict[estimator_name] = mec
        
        return mec_dict
    
[docs]    def perm_based_interaction(self, features, evaluation_fn,
                                  estimator_names=None, n_jobs=1, subsample=1.0, 
                                  n_bootstrap=1, verbose=False):
        """
        Compute the performance-based feature interactions from Oh (2019) [6]_. 
        For a pair of features, the loss of skill is recorded for permuting
        each feature separately and permuting both. If there is no feature interaction
        and the covariance between the two features is close to zero, the sum of the
        individual losses will approximately equal the loss of skill from permuting
        both features. Otherwise, a non-zero difference indicates some interaction.
        The differences for different pairs of features can be used to rank the
        strength of any feature interactions. 
        
        References
        -------------
        .. [6]  Oh, Sejong, 2019. Feature Interaction in Terms of Prediction Performance 
            https://www.mdpi.com/2076-3417/9/23/5191
            
            
        Parameters
        -----------
        
        features : list of 2-tuple of strings 
            Pairs of features to compute the interaction strength for. 
        
        evaluation_fn : string or callable 
            evaluation/scoring function for evaluating the loss of skill once a feature is permuted. 
            evaluation_fn can be set to one of the following strings:
            
                - ``"auc"``, Area under the Curve
                - ``"auprc"``, Area under the Precision-Recall Curve
                - ``"bss"``, Brier Skill Score
                - ``"mse"``, Mean Square Error
                - ``"norm_aupdc"``,  Normalized Area under the Performance Diagram (Precision-Recall) Curve
                
            Otherwise, evaluation_fn can be any function of form, 
            `evaluation_fn(targets, predictions)` and must return a scalar value
        
        estimator_names : string, list of strings
        
            If using multiple estimators, you can pass a single (or subset of) estimator name(s) 
            to compute for. 
            
        subsample: float or integer (default=1.0 for no subsampling)
        
            - if value is between 0-1, it is interpreted as fraction of total X to use 
            - if value > 1, interpreted as the absolute number of random samples of X.
        
        n_jobs : interger or float (default=1; no multiprocessing)
        
            - if integer, interpreted as the number of processors to use for multiprocessing
            - if float between 0-1, interpreted as the fraction of proceesors to use for multiprocessing
        
        n_bootstrap: integer (default=None for no bootstrapping)
            Number of bootstrap resamples for computing confidence intervals on the feature pair rankings. 
        
        Returns
        ---------
        
        results_ds : xarray.Dataset
            Permutation importance-based feature interaction strength results
        
        
        Examples
        ---------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators,
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> important_vars = ['sfc_temp', 'temp2m', 'sfcT_hrs_bl_frez', 'tmp2m_hrs_bl_frez',
        ...      'uplwav_flux']
        >>> important_vars_2d = list(itertools.combinations(important_vars, r=2))
        >>> perm_based_interact_ds = explainer.perm_based_interaction(
        ...                          important_vars_2d, evaluation_fn='norm_aupdc',
        ...                         )
        """
        if estimator_names is None:
            estimator_names=self.estimator_names
        else:
            if is_str(estimator_names):
                estimator_names=[estimator_names]
                
        results_ds = self.global_obj.compute_interaction_rankings_performance_based(
            estimator_names, 
            features, 
            evaluation_fn=evaluation_fn,
            estimator_output=self.estimator_output, 
            subsample=subsample,
            n_bootstrap=n_bootstrap,
            n_jobs=n_jobs,
            verbose=verbose)
    
        self.attrs_dict['method'] = 'perm_based'
        self.attrs_dict['estimators used'] = estimator_names
        self.attrs_dict['estimator output'] = self.estimator_output
        self.attrs_dict['evaluation_fn'] = 'Interaction Importance' 
                        
        results_ds = self._append_attributes(results_ds)
        
        return results_ds
    
    
[docs]    def ice(self, features, n_bins=30, n_jobs=1, subsample=1.0, n_bootstrap=1, random_seed=1,):
        """
        Compute the indiviudal conditional expectations (ICE) [7]_.

        References
        ------------
        .. [7] https://christophm.github.io/interpretable-ml-book/ice.html
    

        Parameters
        -----------
        
        features : string or list of strings or 'all'
            Features to compute the ICE for.  if 'all', the method will compute 
            the ICE for all features. 
            
        n_bins : integer (default=30)
            Number of bins used to compute the ICE for. Bins are decided based 
            on percentile intervals to ensure the same number of samples are in 
            each bin. 
            
        n_jobs : float or integer (default=1)
            
            - if integer, interpreted as the number of processors to use for multiprocessing
            - if float, interpreted as the fraction of proceesors to use for multiprocessing
            
        subsample : float or integer (default=1.0)
            
            - if value between 0-1 interpreted as fraction of total X to use 
            - if value > 1, interpreted as the absolute number of random samples of X.
                
        n_bootstrap : integer (default=1; no bootstrapping)
            Number of bootstrap resamples for computing confidence intervals on the ICE curves.
                
        Returns
        ---------
        
        results : xarray.DataSet
            Main keys are the user-provided estimator names while the sub-key 
            are the features computed for. The items are data for the ICE curves. Also, 
            contains X data (feature values where the ICE curves were computed) for plotting. 
            
        Examples
        ---------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models()
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators,
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> ice_ds = explainer.ice(features='all', subsample=200)    
  
        """
        if is_str(features):
            if features == 'all':
                features = self.feature_names
            else:
                features = [features]
                
        results_ds = self.global_obj._run_interpret_curves(method="ice",
                            features=features,
                            n_bins=n_bins,
                            n_jobs=n_jobs,
                            subsample=subsample,
                            n_bootstrap=n_bootstrap, 
                            random_seed=random_seed
                                                       )
        
        dimension = '2D' if isinstance(list(features)[0], tuple) else '1D'
        self.attrs_dict['method'] = 'ice'
        self.attrs_dict['dimension'] = dimension
        self.attrs_dict['features used'] = features 
        
        results_ds = self._append_attributes(results_ds)
      
        self.feature_used=features

        return results_ds

[docs]    def pd(self, features, n_bins=25, n_jobs=1, subsample=1.0, n_bootstrap=1, random_seed=42,):
        """
        Computes the 1D or 2D centered partial dependence (PD) [8]_.
        
        References
        ------------
        
        .. [8] https://christophm.github.io/interpretable-ml-book/pdp.html
        
        Parameters
        ----------
        
        features : string or list of strings or 'all'
            Features to compute the PD for.  if 'all', the method will compute 
            the PD for all features. 
            
        n_bins : integer (default=30)
            Number of bins used to compute the PD for. Bins are decided based 
            on percentile intervals to ensure the same number of samples are in 
            each bin. 
            
        n_jobs : float or integer (default=1)
            
            - if integer, interpreted as the number of processors to use for multiprocessing
            - if float, interpreted as the fraction of proceesors to use for multiprocessing
            
        subsample : float or integer (default=1.0)
            
            - if value between 0-1 interpreted as fraction of total X to use 
            - if value > 1, interpreted as the absolute number of random samples of X.
                
        n_bootstrap : integer (default=1; no bootstrapping)
            Number of bootstrap resamples for computing confidence intervals on the PD curves.
                
        Returns
        --------
        
        results : xarray.DataSet
            Partial dependence result dataset 
        
        Examples
        ---------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> pd = explainer.pd(features='all')    
        """
        if is_str(features):
            if features == 'all':
                features = self.feature_names
            if features == 'all_2d':
                features = list(itertools.combinations(self.feature_names, r=2))
         
        results_ds = self.global_obj._run_interpret_curves(method="pd",
                            features=features,
                            n_bins=n_bins,
                            n_jobs=n_jobs,
                            subsample=subsample,
                            n_bootstrap=n_bootstrap, 
                            random_seed=random_seed)
        
        dimension = '2D' if isinstance( list(features)[0] , tuple) else '1D'
        self.attrs_dict['method'] = 'pd'
        self.attrs_dict['dimension'] = dimension
        self.attrs_dict['features used'] = features 
        
        results_ds = self._append_attributes(results_ds)
        self.features_used = features 
        
        return results_ds

[docs]    def ale(self, features=None, n_bins=30, n_jobs=1, subsample=1.0, n_bootstrap=1, random_seed=42, ):
        """
        Compute the 1D or 2D centered accumulated local effects (ALE) [9]_ [10]_.
        For categorical features, simply set the type of those features in the 
        dataframe as ``category`` and the categorical ALE will be computed. 

        References
        -----------
        
        .. [9] https://christophm.github.io/interpretable-ml-book/ale.html
        
        .. [10] Apley, D. W., and J. Zhu, 2016: Visualizing the Effects of Predictor Variables in 
                Black Box Supervised Learning Models. ArXiv. 
        
        
        Parameters
        ----------
        
        features : string or list of strings or 'all'
            Features to compute the PD for.  if 'all', the method will compute 
            the ALE for all features. 
            
        n_bins : integer (default=30)
            Number of bins used to compute the ALE for. Bins are decided based 
            on percentile intervals to ensure the same number of samples are in 
            each bin. 
            
        n_jobs : float or integer (default=1)
            
            - if integer, interpreted as the number of processors to use for multiprocessing
            - if float, interpreted as the fraction of proceesors to use for multiprocessing
            
        subsample : float or integer (default=1.0)
            
            - if value between 0-1 interpreted as fraction of total X to use 
            - if value > 1, interpreted as the absolute number of random samples of X.
                
        n_bootstrap : integer (default=1; no bootstrapping)
            Number of bootstrap resamples for computing confidence intervals on the ALE curves.
                
        Returns
        ----------
        
        results : xarray.DataSet
            ALE result dataset

        Raise
        ----------
        Exception
            Highly skewed data may not be divisable into n_bins given. In that case, calc_ale
            uses the max bins the data can be divided into. But a warning message is raised.
               
        Examples
        ---------
        >>> import pymint
        >>> estimators = pymint.load_models() # pre-fit estimators within pymint
        >>> X, y = pymint.load_data() # training data 
        >>> # Set the type for categorical features and InterpretToolkit with compute the 
        >>> # categorical ALE. 
        >>> X = X.astype({'urban': 'category', 'rural':'category'})
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> ale = explainer.ale(features='all') 
        """
        if is_str(features):
            if features == 'all':
                features = self.feature_names
            elif features == 'all_2d':
                features = list(itertools.combinations(self.feature_names, r=2))
            else:
                features = [features]
            
        results_ds = self.global_obj._run_interpret_curves(method="ale",
                            features=features,                            
                            n_bins=n_bins,
                            n_jobs=n_jobs,
                            subsample=subsample,
                            n_bootstrap=n_bootstrap, 
                            random_seed=random_seed)
        
        dimension = '2D' if isinstance( list(features)[0] , tuple) else '1D'
        self.attrs_dict['method'] = 'ale'
        self.attrs_dict['dimension'] = dimension
        self.attrs_dict['features used'] = features 

        results_ds = self._append_attributes(results_ds)
        self.features_used = features 

        return results_ds

[docs]    def friedman_h_stat(self, pd_1d, pd_2d, features, estimator_names=None, **kwargs):
        """
        Compute the second-order Friedman's H-statistic for computing feature interactions [11]_ [12]_. 
        Based on equation (44) from Friedman and Popescu (2008) [12]_. Only computes the interaction strength 
        between two features. In future versions of PyMint we hope to include the first-order H-statistics
        that measure the interaction between a single feature and the 
        remaining set of features.
        
        References
        -----------
        
        .. [11] https://christophm.github.io/interpretable-ml-book/interaction.html 
        .. [12] Friedman, J. H., and B. E. Popescu, 2008: Predictive learning via rule ensembles. 
                Ann Appl Statistics, 2, 916–954, https://doi.org/10.1214/07-aoas148.
       
        
        Parameters
        -----------
        
        pd_1d : xarray.Dataset
            1D partial dependence dataset. Results of :func:`~InterpretToolkit.pd` for ``features``
            
        pd_2d : xarray.Dataset
            2D partial dependence dataset. Results of :func:`~InterpretToolkit.pd`, but 2-tuple combinations 
            of ``features``. 
       
        features : list of 2-tuples of strings
            The pairs of features to compute the feature interaction between.
        
        estimator_names : string, list of strings (default is None)
        
            If using multiple estimators, you can pass a single (or subset of) estimator name(s) 
            to compute the H-statistic for. 
        
        
        Returns
        ----------
        
        results_ds : xarray.Dataset
            The second-order Friedman H-statistic for all estimators.
            
        Examples
        ---------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models()
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> pd_1d = explainer.pd(features='all')
        >>> pd_2d = explainer.pd(features='all_2d')
        >>> hstat = explainer.friedman_h_stat(pd_1d, pd_2d,)
        """
        if estimator_names is None:
            estimator_names = self.estimator_names
        else:
            if is_str(estimator_names):
                estimator_names = [estimator_names]
   
        results_ds = self.global_obj.compute_scalar_interaction_stats(
                                                    method = 'hstat',
                                                    data=pd_1d,
                                                    data_2d = pd_2d,
                                                    features=features,
                                                    estimator_names=estimator_names,
                                                    **kwargs,
                                                   ) 
    
        results_ds = self._append_attributes(results_ds)
    
        return results_ds
    
[docs]    def interaction_strength(self, ale, estimator_names=None, **kwargs):
        """
        Compute the InterAction Strength (IAS) statistic from Molnar et al. (2019) [5]_.
        The IAS varies between 0-1 where values closer to 0 indicate no feature interaction
        strength.

        Parameters
        ------------
        
        ale : xarray.Dataset 
        
            Results of :func:`~InterpretToolkit.ale`, but must be computed for all features
            
        estimator_names : string, list of strings (default is None)
        
            If using multiple estimators, you can pass a single (or subset of) estimator name(s) 
            to compute the IAS for. 
            
        kwargs : dict

            - subsample 
            - n_bootstrap 
            - estimator_output 

        Returns
        ----------
        
        results_ds : xarray.Dataset 
            Interaction strength result dataset
        
        Examples
        ---------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> ale = explainer.ale(features='all')
        >>> ias = explainer.interaction_strength(ale)
        """
        if estimator_names is None:
            estimator_names = self.estimator_names
        else:
            if is_str(estimator_names):
                estimator_names = [estimator_names]

        # Check that ale_data is an xarray.Dataset
        if not isinstance(ale, xr.core.dataset.Dataset):
            raise ValueError("""
                                 ale must be an xarray.Dataset, 
                                 perferably generated by mintpy.InterpretToolkit.calc_ale to be formatted correctly
                                 """
                                )
        else:
            any_missing = all([m in ale.attrs['estimators used'] for m in estimator_names])
            if not any_missing:
                raise ValueError(f'ale does not contain data for all the estimator names given!')
     
        kwargs['estimator_output'] = self.estimator_output
    
        results_ds = self.global_obj.compute_scalar_interaction_stats(
                                                    method = 'ias',
                                                    data=ale,
                                                    estimator_names=estimator_names,
                                                    **kwargs, 
                                                   ) 
        results_ds = self._append_attributes(results_ds)
        
        return results_ds
    
    
    def _plot_interpret_curves(self, method, data, estimator_names, features=None, 
                               display_feature_names={}, display_units={}, 
                               to_probability=False, **kwargs):
        """
        FOR INTERNAL USE ONLY. 
        
        Handles 1D or 2D PD/ALE plots.
        """
        if features is None:
            try:
                features = self.features_used
            except:
                raise ValueError('No features were provided to plot!')
        else:
            if is_str(features):
                features=[features]
                
        if data.attrs['dimension'] == '2D':
            plot_obj = PlotInterpret2D()
            return plot_obj.plot_contours(method=method,
                                          data=data,
                                          estimator_names=estimator_names,
                                          features=features,
                                          display_feature_names=display_feature_names,
                                          display_units=display_units,
                                          to_probability = to_probability,
                                          **kwargs)
        else:
            base_font_size = 12 if len(features) <= 6 else 16
            base_font_size = kwargs.get('base_font_size', base_font_size) 
            plot_obj = PlotInterpretCurves(BASE_FONT_SIZE=base_font_size)
            return plot_obj.plot_1d_curve(method=method,
                                          data=data,
                                          estimator_names=estimator_names,
                                          features=features,
                                          display_feature_names=display_feature_names,
                                          display_units=display_units,
                                          to_probability = to_probability,
                                          **kwargs)

[docs]    def plot_pd(self, pd=None, features=None, estimator_names=None, 
                display_feature_names={}, display_units={}, 
                line_colors=None, to_probability=False, **kwargs):
        """
        Runs the 1D and 2D partial dependence plotting. 
      
        Parameters
        ----------
        
        pd : xarray.Dataset
            Results of :func:`~InterpretToolkit.pd` for
            ``features``.
            
        features : string, list of strings, list of 2-tuple of strings
            Features to plot the PD for.  To plot for 2D PD, 
            pass a list of 2-tuples of features.
            
        estimator_names : string, list of strings (default is None)
            If using multiple estimators, you can pass a single (or subset of) estimator name(s) 
            to plot for.
            
        display_feature_names : dict 
            For plotting purposes. Dictionary that maps the feature names 
            in the pandas.DataFrame to display-friendly versions.
            E.g., ``display_feature_names = { 'dwpt2m' : '$T_{d}$', }``
            
            The plotting code can handle latex-style formatting. 
        
        display_units : dict 
            For plotting purposes. Dictionary that maps the feature names 
            to their units. 
            E.g., ``display_units = { 'dwpt2m' : '$^\circ$C', }``
        
        line_colors : str or list of strs of len(estimators)
            User-defined colors for curve plotting.

        to_probability : boolean 
            If True, the values are multipled by 100. 
        
        Keyword arguments include arguments typically used for matplotlib. 
        

        Returns
        --------
        
        fig, axes: matplotlib figure instance and the corresponding axes 
        
        
        Examples
        ---------
        >>> import pymint
        >>> estimators = pymint.load_models() # pre-fit estimators within pymint
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> pd = explainer.calc_pd(features='all')
        >>> # Provide a small subset of features to plot
        >>> important_vars = ['sfc_temp', 'temp2m', 'sfcT_hrs_bl_frez', 
        ...     'tmp2m_hrs_bl_frez','uplwav_flux']
        >>> explainer.plot_pd(pd, features=important_vars)
        
        """
        if estimator_names is None:
            estimator_names = self.estimator_names
        else:
            if is_str(estimator_names):
                estimator_names = [estimator_names]
                
        if pd.attrs['estimator_output'] == 'probability':
            to_probability=True
            
        if to_probability:
            kwargs['left_yaxis_label'] = 'Centered PD (%)'
        else:
            kwargs['left_yaxis_label'] = 'Centered PD'
            
        return self._plot_interpret_curves(
                               method='pd',
                               data=pd,
                               features=features,
                               estimator_names=estimator_names,
                               display_feature_names=display_feature_names,
                               display_units=display_units,
                               to_probability=to_probability,
                               line_colors=line_colors,            
                               **kwargs)

[docs]    def plot_ale(self, ale=None, features=None, estimator_names=None, 
                 display_feature_names={}, display_units={}, 
                 line_colors=None, to_probability=False, **kwargs):
        """
        Runs the 1D and 2D accumulated local effects plotting.
        
        Parameters
        ----------
        
        ale : xarray.Dataset
             Results of :func:`~InterpretToolkit.ale` for
            ``features``.
        
        features : string, list of strings, list of 2-tuple of strings
            Features to plot the PD for.  To plot for 2D PD, 
            pass a list of 2-tuples of features.
            
        estimator_names : string, list of strings (default is None)
            If using multiple estimators, you can pass a single (or subset of) estimator name(s) 
            to plot for. 
        
        display_feature_names : dict 
            For plotting purposes. Dictionary that maps the feature names 
            in the pandas.DataFrame to display-friendly versions.
            E.g., ``display_feature_names = { 'dwpt2m' : '$T_{d}$', }``
            
            The plotting code can handle latex-style formatting. 
        
        display_units : dict 
            For plotting purposes. Dictionary that maps the feature names 
            to their units. 
            E.g., ``display_units = { 'dwpt2m' : '$^\circ$C', }``
        
        line_colors : str or list of strs of len(estimators)
            User-defined colors for curve plotting.

        to_probability : boolean 
            If True, the values are multipled by 100. 
        
        Keyword arguments include arguments typically used for matplotlib. 
            E.g., 
            figsize, hist_color,  
        
        Returns
        --------
        
        fig, axes: matplotlib figure instance and the corresponding axes 
        
        
        Examples
        ---------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> ale = explainer.ale(features='all')
        >>> # Provide a small subset of features to plot
        >>> important_vars = ['sfc_temp', 'temp2m', 'sfcT_hrs_bl_frez', 
        ...     'tmp2m_hrs_bl_frez','uplwav_flux']
        >>> explainer.plot_ale(ale, features=important_vars)
        
        .. image :: ../../images/ale_1d.png
        """
        if estimator_names is None:
            estimator_names = self.estimator_names
        else:
            if is_str(estimator_names):
                estimator_names = [estimator_names]
        
        if ale.attrs['estimator_output'] == 'probability':
            to_probability=True
        
        if to_probability:
            kwargs['left_yaxis_label'] = 'Centered ALE (%)'
        else:
            kwargs['left_yaxis_label'] = 'Centered ALE'
        
        return self._plot_interpret_curves(
                               method = 'ale',
                               data=ale,
                               features=features,
                               estimator_names=estimator_names,
                               display_feature_names=display_feature_names,
                               display_units=display_units,
                               to_probability=to_probability,
                               line_colors=line_colors,
                               **kwargs)

[docs]    def local_contributions(self, 
                           method='shap', 
                           performance_based=False,
                           n_samples=100, 
                           shap_kwargs={'algorithm' : 'auto'},
                           ):
        """
        Computes the individual feature contributions to a predicted outcome for
        a series of examples either based on tree interpreter (only Tree-based methods) 
        or Shapley Additive Explanations. 

        Parameters
        -----------
        
        method : ``'shap'`` or ``'tree_interpreter'``
            Can use SHAP or treeinterpreter to compute the feature contributions.
            SHAP is estimator-agnostic while treeinterpreter can only be used on
            select decision-tree based estimators in scikit-learn. SHAP will attempt 
            to first use the Tree-based explainer and if that fails, then the 
            Kernel-based explainer. 

        performance_based : boolean (default=False)
            If True, will average feature contributions over the best and worst
            performing of the given X. The number of examples to average over
            is given by n_samples

        n_samples : interger (default=100)
            Number of samples to compute average over if performance_based = True

        shap_kwargs : dict
            Arguments passed to the shap.Explainer object. See 
            https://shap.readthedocs.io/en/latest/generated/shap.Explainer.html#shap.Explainer
            for details. The main two arguments supported in PyMint is the masker and 
            algorithm options. By default, the masker option uses 
            masker = shap.maskers.Partition(X, max_samples=100, clustering="correlation") for
            hierarchical clustering by correlations. You can also provide a background dataset
            e.g., background_dataset = shap.sample(X, 100).reset_index(drop=True). The algorithm 
            option is set to "auto" by default. 
            
            - masker
            - algorithm 


        Returns
        --------
        
        results_df : nested pandas.DataFrame
            For each example, contributions from each feature plus the bias 
            The dataframe is nested by the estimator names and additional keys
            if performance_based=True. 
            
        
        Examples
        ---------
        >>> import pymint
        >>> import shap
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> # Only give the X you want contributions for. 
        >>> # In this case, we are using a single example. 
        >>> single_example = X.iloc[[0]]
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=single_example,
        ...                            )
        >>> # Create a background dataset; randomly sample 100 X
        >>> background_dataset = shap.sample(X, 100)
        >>> contrib_ds = explainer.local_contributions(method='shap', 
        ...                   background_dataset=background_dataset)

        >>> # For the performance-based contributions, 
        >>> # provide the full set of X and y values.
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                            y=y,
        ...                            )
        >>> contrib_ds = explainer.local_contributions(method='shap', 
        ...                   background_dataset=background_dataset, 
        ...                   performance_based=True, n_samples=100)

        """
        results_df = self.local_obj._get_local_prediction(method=method,
                                            performance_based=performance_based,
                                            n_samples=n_samples, 
                                            shap_kwargs=shap_kwargs)

        # Add metadata
        self.attrs_dict['method'] = method
        self.attrs_dict['n_samples'] = n_samples
        self.attrs_dict['performance_based'] = str(performance_based)
        self.attrs_dict['feature_names'] = self.feature_names
        results_df = self._append_attributes(results_df)

        return results_df

[docs]    def plot_contributions(self, 
                           contrib=None,
                           features=None, 
                           estimator_names=None,
                           display_feature_names={}, 
                           **kwargs):
        """
        Plots the feature contributions.
        
        Parameters
        ------------
        contrib : Nested pandas.DataFrame
            Results of :func:`~InterpretToolkit.local_contributions`

        features : string or list of strings (default=None)
        
               Features to plot. If None, all features are eligible to be plotted. 
               However, the default number of features to plot is 10. Can be set 
               by n_vars (see keyword arguments).
            
        estimator_names : string, list of strings (default is None)
        
            If using multiple estimators, you can pass a single (or subset of) estimator name(s) 
            to compute the IAS for. 

        display_feature_names : dict 
            For plotting purposes. Dictionary that maps the feature names 
            in the pandas.DataFrame to display-friendly versions.
            E.g., display_feature_names = { 'dwpt2m' : 'T$_{d}$', }
            The plotting code can handle latex-style formatting.

        Keyword arguments include arguments typically used for matplotlib

        Returns
        ---------
        
        fig: matplotlib figure instance
        
        Examples
        ---------
        >>> import pymint
        >>> import shap
        >>> estimators = pymint.load_models() # pre-fit estimators within pymint
        >>> X, y = pymint.load_data() # training data 
        >>> # Only give the X you want contributions for. 
        >>> # In this case, we are using a single example. 
        >>> single_example = X.iloc[[0]]
        >>> explainer = pymint.InterpretToolkit(estimators=estimators,
        ...                             X=single_example,
        ...                            )
        >>> # Create a background dataset; randomly sample 100 X
        >>> background_dataset = shap.sample(X, 100)
        >>> contrib_ds = explainer.local_contributions(method='shap', 
        ...                   background_dataset=background_dataset)

        >>> explainer.plot_contributions(contrib_ds)
        
        .. image :: ../../images/feature_contribution_single.png
        """
        if estimator_names is None:
            estimator_names = contrib.attrs['estimators used']
        elif is_str(estimator_names):
            estimator_names=[estimator_names]
        
        estimator_output = contrib.attrs['estimator_output']
        if features is None:
            features = contrib.attrs['feature_names']
            
        # initialize a plotting object
        only_one_panel = (contrib.index[0][0] == 'non_performance' and len(estimator_names)==1)
        base_font_size = kwargs.get('base_font_size', 16 if only_one_panel else 11)
        plot_obj = PlotFeatureContributions(BASE_FONT_SIZE=base_font_size)
        kwargs['estimator_output'] = self.estimator_output
        
        return plot_obj.plot_contributions(data=contrib,
                                           estimator_names = estimator_names,
                                           features=features,
                                           display_feature_names=display_feature_names,
                                           **kwargs)

[docs]    def shap(self, shap_kwargs={'masker' : None, 'algorithm' : 'auto'}):
        """
        Compute the SHapley Additive Explanations (SHAP) values [13]_ [14]_ [15]_. The calculations starts
        with the Tree-based explainer and then defaults to the Kernel-based explainer for
        non-tree based estimators. If using a non-tree based estimators, then you must provide a 
        background dataset 
        
        Parameters
        ------------------ 
        background_dataset : array of shape (n_samples, n_features)
            A representative (often a K-means or random sample) subset of the
            data used to train the ML estimator. Used for the background dataset
            to compute the expected values for the SHAP calculations.
            Only required for non-tree based methods.

        Returns
        -------------------
        
        results : dict
            Dictionary where the keys represent estimator names, and the
            values represent a tuple of SHAP values and the bias.
            shap_values is of type numpy.array (n_samples, n_features)
            bias is of type numpy.array (1, n_features)
       
       
        References
        ------------
        .. [13] https://christophm.github.io/interpretable-ml-book/shap.html
        .. [14] Lundberg, S. M., G. G. Erion, and S.-I. Lee, 2018: Consistent Individualized 
                Feature Attribution for Tree Ensembles. Arxiv,.
        .. [15] Lundberg, S. M., and Coauthors, 2020: From local explanations to global understanding 
                with explainable AI for trees. Nat Mach Intell, 2, 56–67, https://doi.org/10.1038/s42256-019-0138-9.
       
       
        Examples
        ---------
        >>> import pymint
        >>> import shap
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> # Create a background dataset; randomly sample 100 X
        >>> background_dataset = shap.sample(X, 100)
        >>> shap_results = explainer.shap(background_dataset)
        """
        results = {}
        
        for estimator_name, estimator in self.estimators.items():
            shap_values, bias = self.local_obj._get_shap_values(estimator=estimator,
                                                 X=self.X, shap_kwargs=shap_kwargs,)
            results[estimator_name] = (shap_values, bias)
        
        return results


[docs]    def plot_shap(self, 
                  plot_type='summary',
                  shap_values=None,
                  features=None, 
                  display_feature_names={},
                  display_units={},
                  **kwargs):
        """
        Plot the SHapley Additive Explanations (SHAP) [13]_ [14]_ [15]_ summary plot or dependence 
        plots for various features.
        
        Parameters
        -----------

        plot_type : ``'summary'`` or ``'dependence'`` 
            if 'summary', plots a feature importance-style plot 
            if 'dependence', plots a partial depedence style plot 

        shap_values : array of shape (n_samples, n_features) 
        
            SHAP values 
        
        features : string or list of strings (default=None)
            features to plots if plot_type is 'dependence'.
        
        display_feature_names : dict 
            For plotting purposes. Dictionary that maps the feature names 
            in the pandas.DataFrame to display-friendly versions.
            E.g., ``display_feature_names = { 'dwpt2m' : '$T_{d}$', }``
            The plotting code can handle latex-style formatting. 
        
        display_units : dict 
            For plotting purposes. Dictionary that maps the feature names
            to their units. 
            E.g., ``display_units = { 'dwpt2m' : '$^\circ$C', }``
        
        to_probability : boolean
            if True, values are multiplied by 100. 

        Returns
        -----------------------
        fig: matplotlib figure instance
        
        Examples
        ---------
        >>> import pymint
        >>> import shap
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> # Create a background dataset; randomly sample 100 X
        >>> background_dataset = shap.sample(X, 100)
        >>> shap_results = explainer.shap(background_dataset)
        >>> print(estimator_names)
        ... ['Random Forest', ]
        >>> shap_values, bias = shap_results[estimator_names[0]]
        >>> # Plot the SHAP-summary style plot 
        >>> explainer.plot_shap(plot_type='summary',shap_values=shap_values,)
        
        >>> # Plot the SHAP-dependence style plot 
        >>> important_vars = ['sfc_temp', 'temp2m', 'sfcT_hrs_bl_frez', 'tmp2m_hrs_bl_frez','uplwav_flux']
        >>> explainer.plot_shap(plot_type='dependence',
        ...            shap_values=shap_values, features=important_vars)

        .. image :: ../../images/shap_dependence.png
        
        """
        to_probability = True if self.estimator_output == 'probability' else False 
        if to_probability:
            shap_values_copy = np.copy(shap_values)
            shap_values_copy *= 100.
        else:
            shap_values_copy = shap_values
            
        # initialize a plotting object
        if plot_type == 'summary':
            fontsize=12
        else:
            fontsize=12 if len(features) <= 6 else 16

        base_font_size = kwargs.get('base_font_size', fontsize)
        plot_obj = PlotFeatureContributions(BASE_FONT_SIZE=base_font_size)
        plot_obj.feature_names = self.feature_names
        plot_obj.plot_shap(shap_values=shap_values_copy,
                           X=self.X,
                           features=features,
                           plot_type=plot_type,
                           display_feature_names=display_feature_names,
                           display_units=display_units,
                           **kwargs
                          )

[docs]    def plot_importance(self, 
                        data,
                        panels,
                        plot_correlated_features=False,
                        **kwargs):
        """
        Method for plotting the permutation importance and other ranking-based results.

        Parameters
        -------------
        panels: List of 2-tuple of (estimator name, method) to determine the sub-panel
                matrixing for the plotting. E.g., If you wanted to compare multi-pass to 
                single-pass permutation importance for a random forest: 
               ``panels  = [('Random Forest', 'multipass'), ('Random Forest', 'singlepass')``
                The available ranking methods in PyMint include 'multipass', 'singlepass', 
                'perm_based', 'ale_variance', or 'ale_variance_interactions'. 
                
        data :  list of xarray.Datasets
            Results from 
            
            - :func:`~InterpretToolkit.permutation_importance`
            - :func:`~InterpretToolkit.ale_variance`
            - :func:`~InterpretToolkit.friedman_h_stat`
            - :func:`~InterpretToolkit.perm_based_interaction`
            
            For each element in panels, there needs to be a corresponding element in data. 

        columns : list of strings
            What will be the columns of the plot? These can be x-axis label (default is
            the different estimator names)
        
        rows : list of strings
            Y-axis label or multiple labels for each row in a multi-panel plot. (default is None). 
        
        plot_correlated_features : boolean
            If True, pairs of features with a linear correlation coefficient > 0.8 
            are annotate/paired by bars or color-coding. This is useful for identifying
            spurious rankings due to the correlations. 
        
        kwargs : keyword arguments
        
        num_vars_to_plot : integer
            Number of features to plot from permutation importance calculation.

        Returns
        --------
        fig: matplotlib figure instance
        
        
        Examples
        -------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators,
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> perm_imp_results = explainer.permutation_importance( 
        ...                       n_vars=10,
        ...                       evaluation_fn = 'norm_aupdc',
        ...                       direction = 'backward',
        ...                       subsample=0.5,
        ...                       n_bootstrap=20, 
        ...                       )
        >>> explainer.plot_importance(data=perm_imp_results, method='multipass')
        
        
        >>> #If we want to annonate pairs of highly correlated feature pairs
        >>> explainer.plot_importance(data=perm_imp_results, method='multipass', 
        ...                     plot_correlated_features=True)
        
        .. image :: ../../images/multi_pass_perm_imp.png
        
        """
        if is_list(data):
            assert len(data) == len(panels), 'Panels and Data must have the same number of elements'
        else:
            data = [data] 
        
        if len(data) != len(panels):
            # Assuming that data contains multiple models. 
            given_estimator_names = [m[1] for m in panels]
            available_estimators = [f.split('rankings__')[1] for f in list(data[0].data_vars) if 'rank' in f]
            missing = np.array([True if f not in available_estimators else False  for f in given_estimator_names])
            missing_estimators = list(np.array(given_estimator_names)[missing])
            if any(missing):
                txt = ''
                for i in missing_estimators:
                    txt += (i + ', ')
                raise ValueError (f"""Results for {txt} are not in the given dataset. 
                      Check for possible spelling errors""")
               
            data *= len(panels)
  
        for r, (method, estimator_name) in zip(data, panels):
            available_methods = [d.split('__')[0] for d in list(r.data_vars) if f'rankings__{estimator_name}' in d]
            if f"{method}_rankings" not in available_methods:
                raise ValueError(f"""{method} does not match the available methods for this item({available_methods}). 
                         Ensure that the elements of data match up with those panels!
                         Also check for any possible spelling error. 
                         """)
     
        estimator_output = kwargs.get('estimator_output', self.estimator_output)
        kwargs.pop('estimator_output', None)
        
        # initialize a plotting object
        base_font_size = kwargs.get('base_font_size', 12)
        plot_obj = PlotImportance(BASE_FONT_SIZE=base_font_size)

        if plot_correlated_features:
            kwargs['X'] = self.X

        return plot_obj.plot_variable_importance(data,
                                                panels=panels, 
                                                plot_correlated_features=plot_correlated_features,
                                                 estimator_output=estimator_output,
                                                 **kwargs)


[docs]    def plot_box_and_whisker(self, important_vars, example, 
                             display_feature_names={}, display_units={}, **kwargs):
        """
        Plot the training dataset distribution for a given set of important variables
        as a box-and-whisker plot. The user provides a single example, which is highlighted
        over those examples. Useful for real-time explainability. 
        
        Parameters:
        ----------------
        
        important_vars : str or list of strings
            List of features to plot 
        
        example : Pandas Series, shape = (important_vars,) 
            Single row dataframe to be overlaid, must have columns equal to
            the given important_vars
               
        
        """
        if not is_list(important_vars):
            important_vars = [important_vars]
        
        axis = 'columns' if isinstance(example, pd.DataFrame) else 'index'
        if set(getattr(example, axis)) != set(important_vars):
            raise ValueError('The example dataframe/series must have important_vars as columns!')
        
        f, axes = box_and_whisker(self.X, 
                                  top_preds=important_vars, 
                                  example=example, 
                                 display_feature_names=display_feature_names,
                                 display_units=display_units, 
                                 **kwargs)
        return f, axes 
    
[docs]    def plot_scatter(self, features, kde=True, 
                         subsample=1.0, display_feature_names={}, display_units={}, **kwargs):
        """
        2-D Scatter plot of ML model predictions. If kde=True, it will plot KDE contours 
        overlays to show highest concentrations. If the model type is classification, then
        the code will plot KDE contours per class. 
        """
        # TODO: Handle plotting multiple models! 
        # TODO: Determining if it is raw or probability (multiple classes too!) 
        # if there is more than a couple classes, then only plot one kde contours
        
        # Are features in X? 
        bad_features = [f for f in features if f not in self.feature_names]
        if len(bad_features) > 0:
            raise ValueError(f'{bad_features} is not a valid feature. Check for possible spelling errors!')
        
        # initialize a plotting object
        base_font_size = kwargs.get('base_font_size', 12)
        plot_obj = PlotScatter(base_font_size)
        
        f, axes = plot_obj.plot_scatter(self.estimators,
                   X=self.X, 
                   y=self.y, 
                   features=features, 
                   display_feature_names=display_feature_names,
                   display_units = display_units,
                   subsample=subsample, 
               peak_val=None, kde=kde, **kwargs)
        
        return f, axes
    
    
[docs]    def get_important_vars(self, perm_imp_data, multipass=True, n_vars=10, combine=False):
        """
        Retrieve the most important variables from permutation importance.
        Can combine rankings from different estimators and only keep those variables that
        occur in more than one estimator. 

        Parameters
        ------------
        
        perm_imp_data : xarray.Dataset
            Permutation importance result dataset

        multipass : boolean (defaults to True)
        
            if True, return the multipass rankings else returns the singlepass rankings

        n_vars : integer (default=10)
            Number of variables to retrieve if multipass=True.

        combine : boolean  (default=False)
            If combine=True, n_vars can be set such that you only include a certain amount of
            top features from each estimator. E.g., n_vars=5 and combine=True means to combine
            the top 5 features from each estimator into a single list.

        Examples
        -------
            if combine=True
                results : list 
                    List of top features from a different estimators.
            if combine=False
                results : dict
                    keys are the estimator names and items are the
                    top features.
                    
        Examples
        ---------
        >>> import pymint
        >>> # pre-fit estimators within pymint
        >>> estimators = pymint.load_models() 
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> perm_imp_data = explainer.permutation_importance( 
        ...                       n_vars=10,
        ...                       evaluation_fn = 'norm_aupdc',
        ...                       direction = 'backward',
        ...                       subsample=0.5,
        ...                       n_bootstrap=20, 
        ...                       )
        >>> important_vars = explainer.get_important_vars(perm_imp_data, 
        ...        multipass=True, n_vars=5, combine=False)
        ...
        >>> # set combine=True
        >>> important_vars = explainer.get_important_vars(perm_imp_data, 
        ...        multipass=True, n_vars=5, combine=True)       
        """
        results = retrieve_important_vars(perm_imp_data, 
                                          estimator_names=self.estimator_names, 
                                          multipass=multipass)
        if not combine:
            return results
        else:
            return combine_top_features(results, n_vars=n_vars)

[docs]    def load(self, fnames, dtype='dataset'):
        """
        Load results of a computation (permutation importance, calc_ale, calc_pd, etc)

        Parameters
        ----------
        fnames : string or list of strings
            File names of dataframes or datasets to load. 
            
        dtype : 'dataset' or 'dataframe'
            Indicate whether you are loading a set of xarray.Datasets 
            or pandas.DataFrames
           
        Returns
        --------
        
        results : xarray.DataSet or pandas.DataFrame
            data for plotting purposes
            
        Examples
        ---------
        >>> import pymint
        >>> explainer = pymint.InterpretToolkit()
        >>> fname = 'path/to/your/perm_imp_results'
        >>> perm_imp_data = explainer.load(fnames=fname, dtype='dataset')     
            
        """
        if dtype == 'dataset':
            results = load_netcdf(fnames=fnames)
        elif dtype == 'dataframe':
            results = load_dataframe(fnames=fnames) 
        else:
            raise ValueError('dtype must be "dataset" or "dataframe"!')
       
        for s in [self, self.global_obj, self.local_obj]:
            try:
                setattr(s, 'estimator_output', results.attrs['estimator_output'])
                estimator_names = [results.attrs['estimators used']]
            except:
                setattr(s, 'estimator_output', results.attrs['model_output'])
                estimator_names = [results.attrs['models used']]
            
            if not is_list(estimator_names):
                estimator_names = [estimator_names]

            if (any(is_list(i) for i in estimator_names)):
                estimator_names = estimator_names[0] 
            
            setattr(s, 'estimator_names', estimator_names)
            setattr(s, 'estimators used', estimator_names) 
            
        return results

[docs]    def save(self, fname, data):
        """
        Save results of a computation (permutation importance, calc_ale, calc_pd, etc)

        Parameters
        ----------
        fname : string 
            filename to store the results in (including path)
        data : InterpretToolkit results
            the results of a InterpretToolkit calculation. Can be a dataframe or dataset.

        Examples
        -------
        >>> import pymint
        >>> estimators = pymint.load_models() # pre-fit estimators within pymint
        >>> X, y = pymint.load_data() # training data 
        >>> explainer = pymint.InterpretToolkit(estimators=estimators
        ...                             X=X,
        ...                             y=y,
        ...                            )
        >>> perm_imp_results = explainer.calc_permutation_importance( 
        ...                       n_vars=10,
        ...                       evaluation_fn = 'norm_aupdc',
        ...                       direction = 'backward',
        ...                       subsample=0.5,
        ...                       n_bootstrap=20, 
        ...                       )
        >>> fname = 'path/to/save/the/file'
        >>> explainer.save(fname, perm_imp_results) 
        """
        if is_dataset(data):
            save_netcdf(fname=fname,ds=data)
        elif is_dataframe(data):
            save_dataframe(fname=fname, dframe=data)
        else:
            raise TypeError(f'data is not a pandas.DataFrame or xarray.Dataset. The type is {type(data)}.')