Source code for bluemath_tk.datamining.pca

from typing import List, Union

import cartopy.crs as ccrs
import numpy as np
import pandas as pd
import xarray as xr
from sklearn.decomposition import PCA as PCA_
from sklearn.decomposition import IncrementalPCA as IncrementalPCA_
from sklearn.preprocessing import StandardScaler

from ..core.decorators import validate_data_pca
from ._base_datamining import BaseReduction


class PCAError(Exception):
    """
    Custom exception for PCA class.
    """

    def __init__(self, message: str = "PCA error occurred."):
        self.message = message
        super().__init__(self.message)
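
# Usage note (illustrative sketch, not part of the library): PCAError is raised by the
# methods below when the model is used out of order, e.g. calling `pcs_df`, `transform`
# or `inverse_transform` before fitting. A typical guard might look like:
#
#     try:
#         df = pca.pcs_df
#     except PCAError:
#         pcs = pca.fit_transform(data=ds, ...)  # fit first, then retry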

class PCA(BaseReduction):
    """
    Principal Component Analysis (PCA) class.

    Attributes
    ----------
    n_components : Union[int, float]
        The number of components or the explained variance ratio.
    is_incremental : bool
        Indicates whether Incremental PCA is used.
    is_fitted : bool
        Indicates whether the PCA model has been fitted.
    scaler : StandardScaler
        The scaler used for standardizing the data, in case the data is standardized.
    vars_to_stack : List[str]
        The list of variables to stack.
    window_stacked_vars : List[str]
        The list of variables with windows.
    coords_to_stack : List[str]
        The list of coordinates to stack.
    coords_values : dict
        The values of the data coordinates used in fitting.
    pca_dim_for_rows : str
        The dimension for rows in PCA.
    windows_in_pca_dim_for_rows : dict
        The windows in PCA dimension for rows.
    value_to_replace_nans : dict
        The values to replace NaNs in the dataset.
    nan_threshold_to_drop : dict
        The threshold percentage to drop NaNs for each variable.
    num_cols_for_vars : int
        The number of columns for variables.
    pcs : xr.Dataset
        The Principal Components (PCs).

    Examples
    --------
    .. jupyter-execute::

        from bluemath_tk.core.data.sample_data import get_2d_dataset
        from bluemath_tk.datamining.pca import PCA

        ds = get_2d_dataset()

        pca = PCA(
            n_components=5,
            is_incremental=False,
            debug=True,
        )
        pca.fit(
            data=ds,
            vars_to_stack=["X", "Y"],
            coords_to_stack=["coord1", "coord2"],
            pca_dim_for_rows="coord3",
            windows_in_pca_dim_for_rows={"X": [1, 2, 3]},
            value_to_replace_nans={"X": 0.0},
            nan_threshold_to_drop={"X": 0.95},
        )
        pcs = pca.transform(
            data=ds,
        )
        reconstructed_ds = pca.inverse_transform(PCs=pcs)
        eofs = pca.eofs
        explained_variance = pca.explained_variance
        explained_variance_ratio = pca.explained_variance_ratio
        cumulative_explained_variance_ratio = pca.cumulative_explained_variance_ratio

        # Save the full class in a pickle file
        pca.save_model("pca_model.pkl")

        # Plot the calculated EOFs
        pca.plot_eofs(vars_to_plot=["X", "Y"], num_eofs=3)

    References
    ----------
    [1] https://scikit-learn.org/stable/modules/generated/sklearn.decomposition.PCA.html
    [2] https://scikit-learn.org/stable/modules/generated/sklearn.decomposition.IncrementalPCA.html
    [3] https://www.sciencedirect.com/science/article/abs/pii/S0378383911000676
    """

    def __init__(
        self,
        n_components: Union[int, float] = 0.98,
        is_incremental: bool = False,
        debug: bool = False,
    ):
        """
        Initialize the PCA class.

        Parameters
        ----------
        n_components : int or float, optional
            Number of components to keep. If 0 < n_components < 1, it represents
            the proportion of variance to be explained by the selected components.
            If n_components >= 1, it represents the number of components to keep.
            Default is 0.98.
        is_incremental : bool, optional
            If True, use Incremental PCA which is useful for large datasets.
            Default is False.
        debug : bool, optional
            If True, enable debug mode. Default is False.

        Raises
        ------
        ValueError
            If n_components is less than or equal to 0.
        TypeError
            If n_components is not an integer when it is greater than or equal to 1.
        """

        initial_msg = f"""
        -------------------------------------------------------------------
        | Initializing PCA reduction model with the following parameters:
        |    - n_components: {n_components}
        |    - is_incremental: {is_incremental}
        | For more information, please refer to the documentation.
        -------------------------------------------------------------------
        """
        print(initial_msg)

        super().__init__()
        self.set_logger_name(
            name=self.__class__.__name__, level="DEBUG" if debug else "INFO"
        )

        if n_components <= 0:
            raise ValueError("Number of components must be greater than 0.")
        elif n_components >= 1:
            if not isinstance(n_components, int):
                raise TypeError("Number of components must be an integer when >= 1.")
            self.logger.info(f"Number of components: {n_components}")
        else:
            self.logger.info(f"Explained variance ratio: {n_components}")
        self.n_components = n_components
        if is_incremental:
            self.logger.info("Using Incremental PCA")
            self._pca = IncrementalPCA_(n_components=self.n_components)
        else:
            self.logger.info("Using PCA")
            self._pca = PCA_(n_components=self.n_components)
        self.is_fitted: bool = False
        self.is_incremental = is_incremental
        self._data: xr.Dataset = xr.Dataset()
        self._window_processed_data: xr.Dataset = xr.Dataset()
        self._stacked_data_matrix: np.ndarray = np.array([])
        self._standarized_stacked_data_matrix: np.ndarray = np.array([])
        self.scaler: StandardScaler = StandardScaler()
        self.vars_to_stack: List[str] = []
        self.window_stacked_vars: List[str] = []
        self.coords_to_stack: List[str] = []
        self.coords_values: dict = {}
        self.pca_dim_for_rows: str = None
        self.windows_in_pca_dim_for_rows: dict = {}
        self.value_to_replace_nans: dict = {}
        self.nan_threshold_to_drop: dict = {}
        self.not_nan_positions: dict = {}
        self.num_cols_for_vars: int = None
        self.pcs: xr.Dataset = None

        # Exclude attributes from being saved with pca.save_model()
        self._exclude_attributes = [
            "_data",
            "_window_processed_data",
            "_stacked_data_matrix",
            "_standarized_stacked_data_matrix",
        ]

    @property
    def pca(self) -> Union[PCA_, IncrementalPCA_]:
        """
        Returns the PCA or IncrementalPCA instance used for dimensionality reduction.
        """
        return self._pca

    @property
    def data(self) -> xr.Dataset:
        """
        Returns the raw data used for PCA.
        """
        return self._data

    @property
    def window_processed_data(self) -> xr.Dataset:
        """
        Returns the window-processed data used for PCA.
        """
        return self._window_processed_data

    @property
    def stacked_data_matrix(self) -> np.ndarray:
        """
        Returns the stacked data matrix.
        """
        return self._stacked_data_matrix

    @property
    def standarized_stacked_data_matrix(self) -> np.ndarray:
        """
        Returns the standardized stacked data matrix.
        """
        return self._standarized_stacked_data_matrix

    @property
    def eofs(self) -> xr.Dataset:
        """
        Returns the Empirical Orthogonal Functions (EOFs).
        """
        return self._reshape_EOFs(destandarize=False)

    @property
    def explained_variance(self) -> np.ndarray:
        """
        Returns the explained variance of the PCA model.
        """
        return self.pca.explained_variance_

    @property
    def explained_variance_ratio(self) -> np.ndarray:
        """
        Returns the explained variance ratio of the PCA model.
        """
        return self.pca.explained_variance_ratio_

    @property
    def cumulative_explained_variance_ratio(self) -> np.ndarray:
        """
        Returns the cumulative explained variance ratio of the PCA model.
        """
        return np.cumsum(self.explained_variance_ratio)

    @property
    def pcs_df(self) -> pd.DataFrame:
        """
        Returns the principal components as a DataFrame.
        """
        if self.pcs is not None:
            return pd.DataFrame(
                data=self.pcs["PCs"].values,
                columns=[f"PC{i + 1}" for i in range(self.pca.n_components_)],
                index=self.pcs[self.pca_dim_for_rows].values,
            )
        else:
            raise PCAError(
                "PCA model must be fitted and transformed before calling pcs_df"
            )

    def _generate_stacked_data(self, data: xr.Dataset) -> np.ndarray:
        """
        Generate the stacked data matrix.

        Parameters
        ----------
        data : xr.Dataset
            The data to stack.

        Returns
        -------
        np.ndarray
            The stacked data matrix.
        """

        self.logger.info(
            f"Generating data matrix with variables to stack: {self.vars_to_stack} and coordinates to stack: {self.coords_to_stack}"
        )

        self.num_cols_for_vars = 1
        for coord_to_stack in self.coords_to_stack:
            self.num_cols_for_vars *= len(data[coord_to_stack])
        tmp_stacked_data = data.stack(positions=self.coords_to_stack)
        cleaned_vars_to_stack = []
        for var_to_clean in self.window_stacked_vars:
            var_to_clean_values = tmp_stacked_data[var_to_clean].values
            if var_to_clean_values.ndim == 1:
                var_to_clean_values = var_to_clean_values.reshape(-1, 1)
            var_to_clean_threshold = self.nan_threshold_to_drop.get(
                var_to_clean,
                self.nan_threshold_to_drop.get(
                    var_to_clean[:-2],
                    self.nan_threshold_to_drop.get(var_to_clean[:-3], 0.90),
                ),
            )
            not_nan_positions = np.where(
                np.mean(~np.isnan(var_to_clean_values), axis=0) > var_to_clean_threshold
            )[0]
            var_value_to_replace_nans = self.value_to_replace_nans.get(
                var_to_clean,
                self.value_to_replace_nans.get(
                    var_to_clean[:-2], self.value_to_replace_nans.get(var_to_clean[:-3])
                ),
            )
            self.logger.debug(
                f"Replacing NaNs for variable: {var_to_clean} with value: {var_value_to_replace_nans}"
            )
            cleaned_var = self.check_nans(
                data=var_to_clean_values[:, not_nan_positions],
                replace_value=var_value_to_replace_nans,
            )
            cleaned_vars_to_stack.append(cleaned_var)
            self.not_nan_positions[var_to_clean] = not_nan_positions
        stacked_data_matrix = np.hstack(
            [cleaned_var for cleaned_var in cleaned_vars_to_stack]
        )

        self.logger.info(
            f"Data matrix generated successfully with shape: {stacked_data_matrix.shape}"
        )

        return stacked_data_matrix

    def _preprocess_data(
        self, data: xr.Dataset, is_fit: bool = True, scale_data: bool = True
    ) -> np.ndarray:
        """
        Preprocess data for PCA. Steps:
        - Add windows in PCA dimension for rows.
        - Generate stacked data matrix.
        - Standardize data matrix.

        Parameters
        ----------
        data : xr.Dataset
            The data to preprocess.
        is_fit : bool, optional
            If True, set the data. Default is True.
        scale_data : bool, optional
            If True, scale the data. Default is True.

        Returns
        -------
        np.ndarray
            The standardized stacked data matrix.
        """

        window_processed_data = data.copy()
        if self.windows_in_pca_dim_for_rows is not None:
            self.logger.info("Adding windows in PCA dimension for rows")
            for variable, windows in self.windows_in_pca_dim_for_rows.items():
                self.logger.info(f"Adding windows: {windows} for variable: {variable}")
                for window in windows:
                    window_processed_data[f"{variable}_{window}"] = (
                        window_processed_data[variable].shift(
                            {self.pca_dim_for_rows: window}
                        )
                    )
        self.window_stacked_vars = list(window_processed_data.data_vars)

        self.logger.info("Generating stacked data matrix")
        stacked_data_matrix = self._generate_stacked_data(
            data=window_processed_data,
        )

        if scale_data:
            self.logger.info("Standardizing data matrix")
            standarized_stacked_data_matrix, scaler = self.standarize(
                data=stacked_data_matrix,
                scaler=self.scaler if not is_fit else None,
                transform=not is_fit,
            )
        else:
            self.logger.warning("Data is not standardized")
            standarized_stacked_data_matrix = stacked_data_matrix.copy()
            scaler = None

        self.logger.info("Data preprocessed successfully")

        if is_fit:
            self._data = data.copy()
            self._window_processed_data = window_processed_data.copy()
            self.coords_values = {
                coord: data[coord].values for coord in self.coords_to_stack
            }
            self._stacked_data_matrix = stacked_data_matrix.copy()
            self._standarized_stacked_data_matrix = (
                standarized_stacked_data_matrix.copy()
            )
            self.scaler = scaler

        return standarized_stacked_data_matrix

    def _reshape_EOFs(self, destandarize: bool = False) -> xr.Dataset:
        """
        Reshape EOFs to the original data shape.

        Parameters
        ----------
        destandarize : bool, optional
            If True, destandardize the EOFs. Default is False.

        Returns
        -------
        xr.Dataset
            The reshaped EOFs.
        """

        EOFs = self.pca.components_  # Get Empirical Orthogonal Functions (EOFs)
        if destandarize:
            if self.pcs is None:
                raise PCAError(
                    "No Principal Components (PCs) found. Please transform some data first."
                )
            else:
                # Inverse transform the EOFs using stds from the PCs
                EOFs = EOFs * self.pcs["stds"].values.reshape(-1, 1)

        # Create an array full of NaNs with shape (n_components, vars * cols)
        nan_EOFs = np.full(
            (
                self.pca.n_components_,
                self.num_cols_for_vars * len(self.window_stacked_vars),
            ),
            np.nan,
        )
        # Fill the nan_EOFs array with the EOFs values
        filled_EOFs = 0
        for iev, eof_var in enumerate(self.window_stacked_vars):
            eofs_to_fill = len(self.not_nan_positions[eof_var])
            nan_EOFs[
                :, self.not_nan_positions[eof_var] + (iev * self.num_cols_for_vars)
            ] = EOFs[:, filled_EOFs : filled_EOFs + eofs_to_fill]
            filled_EOFs += eofs_to_fill
        # Reshape the nan_EOFs array to the original data shape
        EOFs_reshaped_vars_arrays = np.array_split(
            nan_EOFs, len(self.window_stacked_vars), axis=1
        )
        coords_to_stack_shape = [self.pca.n_components_] + [
            len(self.coords_values[coord]) for coord in self.coords_to_stack
        ]
        EOFs_reshaped_vars_dict = {
            var: (
                ["n_component", *self.coords_to_stack],
                np.array(EOF_reshaped_var).reshape(*coords_to_stack_shape),
            )
            for var, EOF_reshaped_var in zip(
                self.window_stacked_vars, EOFs_reshaped_vars_arrays
            )
        }

        return xr.Dataset(
            EOFs_reshaped_vars_dict,
            coords={
                "n_component": np.arange(self.pca.n_components_),
                **{coord: self.coords_values[coord] for coord in self.coords_to_stack},
            },
        )

    def _reshape_data(self, X: np.ndarray, destandarize: bool = True) -> dict:
        """
        Reshape data to the original data shape.

        Parameters
        ----------
        X : np.ndarray
            The data to reshape.
        destandarize : bool, optional
            If True, destandardize the data. Default is True.

        Returns
        -------
        dict
            The reshaped data variables, keyed by variable name.
        """

        if destandarize and self.scaler is not None:
            X = self.scaler.inverse_transform(X)

        # Create an array full of NaNs with shape (time, vars * cols)
        nan_X = np.full(
            (
                X.shape[0],
                self.num_cols_for_vars * len(self.window_stacked_vars),
            ),
            np.nan,
        )
        # Fill the nan_X array with the X values
        filled_X = 0
        for iev, x_var in enumerate(self.window_stacked_vars):
            x_to_fill = len(self.not_nan_positions[x_var])
            nan_X[:, self.not_nan_positions[x_var] + (iev * self.num_cols_for_vars)] = (
                X[:, filled_X : filled_X + x_to_fill]
            )
            filled_X += x_to_fill
        # Reshape the nan_X array to the original data shape
        X_reshaped_vars_arrays = np.array_split(
            nan_X, len(self.window_stacked_vars), axis=1
        )
        coords_to_stack_shape = [X.shape[0]] + [
            len(self.coords_values[coord]) for coord in self.coords_to_stack
        ]
        X_reshaped_vars_dict = {
            var: (
                [self.pca_dim_for_rows, *self.coords_to_stack],
                np.array(X_reshaped_var).reshape(*coords_to_stack_shape),
            )
            for var, X_reshaped_var in zip(
                self.window_stacked_vars, X_reshaped_vars_arrays
            )
        }

        return X_reshaped_vars_dict

    @validate_data_pca
    def fit(
        self,
        data: xr.Dataset,
        vars_to_stack: List[str],
        coords_to_stack: List[str],
        pca_dim_for_rows: str,
        windows_in_pca_dim_for_rows: dict = {},
        value_to_replace_nans: dict = {},
        nan_threshold_to_drop: dict = {},
        scale_data: bool = True,
    ) -> None:
        """
        Fit PCA model to data.

        Parameters
        ----------
        data : xr.Dataset
            The data to fit the PCA model.
        vars_to_stack : list of str
            The variables to stack.
        coords_to_stack : list of str
            The coordinates to stack.
        pca_dim_for_rows : str
            The PCA dimension to maintain in rows (usually the time).
        windows_in_pca_dim_for_rows : dict, optional
            The window steps to roll the pca_dim_for_rows for each variable.
            Default is {}.
        value_to_replace_nans : dict, optional
            The value to replace NaNs for each variable. Default is {}.
        nan_threshold_to_drop : dict, optional
            The threshold percentage to drop NaNs for each variable.
            By default, stacked columns with less than 90% of valid values are dropped.
            Default is {}.
        scale_data : bool, optional
            If True, scale the data. Default is True.

        Notes
        -----
        For both value_to_replace_nans and nan_threshold_to_drop, the keys are
        the variables, and the suffixes for the windows are considered.
        Example: if you have variable "X", and apply windows [1, 2, 3], you can
        use "X_1", "X_2", "X_3". Nevertheless, you can also use the original
        variable name "X" to apply the same value for all windows.
        """

        self.vars_to_stack = vars_to_stack.copy()
        self.coords_to_stack = coords_to_stack.copy()
        self.pca_dim_for_rows = pca_dim_for_rows
        self.windows_in_pca_dim_for_rows = windows_in_pca_dim_for_rows.copy()
        self.value_to_replace_nans = value_to_replace_nans.copy()
        self.nan_threshold_to_drop = nan_threshold_to_drop.copy()

        self._preprocess_data(
            data=data[self.vars_to_stack], is_fit=True, scale_data=scale_data
        )

        self.logger.info("Fitting PCA model")
        self.pca.fit(X=self.standarized_stacked_data_matrix)
        self.is_fitted = True
        self.logger.info("PCA model fitted successfully")
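
    # Example (hedged sketch of the Notes above; dataset and variable names are
    # illustrative): with windows {"X": [1, 2]}, the stacked variables are "X", "X_1"
    # and "X_2", so either style of key is valid:
    #
    #     pca.fit(
    #         data=ds,
    #         vars_to_stack=["X", "Y"],
    #         coords_to_stack=["coord1", "coord2"],
    #         pca_dim_for_rows="coord3",
    #         windows_in_pca_dim_for_rows={"X": [1, 2]},
    #         value_to_replace_nans={"X": 0.0},     # same value for X, X_1 and X_2
    #         nan_threshold_to_drop={"X_1": 0.95},  # window-specific threshold
    #     )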

    def transform(self, data: xr.Dataset, after_fitting: bool = False) -> xr.Dataset:
        """
        Transform data using the fitted PCA model.

        Parameters
        ----------
        data : xr.Dataset
            The data to transform.
        after_fitting : bool, optional
            If True, use the already processed data. Default is False.
            This is just used in the fit_transform method!

        Returns
        -------
        xr.Dataset
            The transformed data.
        """

        if self.is_fitted is False:
            raise PCAError("PCA model must be fitted before transforming data")

        if not after_fitting:
            self.logger.info("Transforming data using PCA model")
            processed_data = self._preprocess_data(
                data=data[self.vars_to_stack],
                is_fit=False,
                scale_data=self.scaler is not None,
            )
        else:
            processed_data = self.standarized_stacked_data_matrix.copy()
        transformed_data = self.pca.transform(X=processed_data)

        # Save the Principal Components (PCs) in an xr.Dataset
        pcs = xr.Dataset(
            {
                "PCs": ((self.pca_dim_for_rows, "n_component"), transformed_data),
                "stds": (("n_component",), np.std(transformed_data, axis=0)),
            },
            coords={
                self.pca_dim_for_rows: data[self.pca_dim_for_rows],
                "n_component": np.arange(self.pca.n_components_),
            },
        )
        if after_fitting:
            self.pcs = pcs.copy()

        return pcs
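
    # Example (illustrative sketch): transforming a dataset returns an xr.Dataset with a
    # "PCs" variable of shape (pca_dim_for_rows, n_component) plus per-component "stds":
    #
    #     pcs = pca.transform(data=ds)
    #     pcs["PCs"].shape   # (len(ds["coord3"]), pca.pca.n_components_)
    #     pcs["stds"].shape  # (pca.pca.n_components_,)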

    def fit_transform(
        self,
        data: xr.Dataset,
        vars_to_stack: List[str],
        coords_to_stack: List[str],
        pca_dim_for_rows: str,
        windows_in_pca_dim_for_rows: dict = {},
        value_to_replace_nans: dict = {},
        nan_threshold_to_drop: dict = {},
        scale_data: bool = True,
    ) -> xr.Dataset:
        """
        Fit and transform data using PCA model.

        Parameters
        ----------
        data : xr.Dataset
            The data to fit the PCA model.
        vars_to_stack : list of str
            The variables to stack.
        coords_to_stack : list of str
            The coordinates to stack.
        pca_dim_for_rows : str
            The PCA dimension to maintain in rows (usually the time).
        windows_in_pca_dim_for_rows : dict, optional
            The window steps to roll the pca_dim_for_rows for each variable.
            Default is {}.
        value_to_replace_nans : dict, optional
            The value to replace NaNs for each variable. Default is {}.
        nan_threshold_to_drop : dict, optional
            The threshold percentage to drop NaNs for each variable.
            By default, stacked columns with more than 10% of NaNs are dropped.
            Default is {}.
        scale_data : bool, optional
            If True, scale the data. Default is True.

        Returns
        -------
        xr.Dataset
            The transformed data representing the Principal Components (PCs).

        Notes
        -----
        For both value_to_replace_nans and nan_threshold_to_drop, the keys are
        the variables, and the suffixes for the windows are considered.
        Example: if you have variable "X", and apply windows [1, 2, 3], you can
        use "X_1", "X_2", "X_3". Nevertheless, you can also use the original
        variable name "X" to apply the same value for all windows.
        """

        self.fit(
            data=data,
            vars_to_stack=vars_to_stack,
            coords_to_stack=coords_to_stack,
            pca_dim_for_rows=pca_dim_for_rows,
            windows_in_pca_dim_for_rows=windows_in_pca_dim_for_rows,
            value_to_replace_nans=value_to_replace_nans,
            nan_threshold_to_drop=nan_threshold_to_drop,
            scale_data=scale_data,
        )

        return self.transform(data=data, after_fitting=True)

    def inverse_transform(self, PCs: Union[xr.DataArray, xr.Dataset]) -> xr.Dataset:
        """
        Inverse transform data using the fitted PCA model.

        Parameters
        ----------
        PCs : Union[xr.DataArray, xr.Dataset]
            The data to inverse transform.
            It should be the Principal Components (PCs).

        Returns
        -------
        xr.Dataset
            The inverse transformed data.
        """

        if self.is_fitted is False:
            raise PCAError("PCA model must be fitted before inverse transforming data")

        if isinstance(PCs, xr.Dataset):
            X = PCs["PCs"].values
        elif isinstance(PCs, xr.DataArray):
            X = PCs.values

        self.logger.info("Inverse transforming data using PCA model")
        X_transformed = self.pca.inverse_transform(X=X)
        data_reshaped_vars_dict = self._reshape_data(X=X_transformed, destandarize=True)

        # Create xarray Dataset with the transformed data
        data_transformed = xr.Dataset(
            data_reshaped_vars_dict,
            coords={
                self.pca_dim_for_rows: PCs[self.pca_dim_for_rows].values,
                **{coord: self.coords_values[coord] for coord in self.coords_to_stack},
            },
        )

        return data_transformed
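
    # Example (illustrative round-trip check, not part of the library): reconstruct the
    # fitted data from its PCs and compare against the original fields:
    #
    #     pcs = pca.fit_transform(data=ds, vars_to_stack=["X", "Y"], ...)
    #     reconstructed_ds = pca.inverse_transform(PCs=pcs)
    #     # Mean absolute reconstruction error for one variable
    #     # (NaNs are re-inserted for columns dropped during stacking)
    #     error = float(abs(reconstructed_ds["X"] - ds["X"]).mean(skipna=True))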

    def plot_pcs(self, num_pcs: int, pcs: xr.Dataset = None) -> None:
        """
        Plot the Principal Components (PCs).

        Parameters
        ----------
        num_pcs : int
            The number of Principal Components (PCs) to plot.
        pcs : xr.Dataset, optional
            The Principal Components (PCs) to plot.
        """

        if pcs is None:
            if self.pcs is None:
                raise PCAError(
                    "No Principal Components (PCs) found. Please transform some data first."
                )
            self.logger.info("Using the Principal Components (PCs) from the class")
            pcs = self.pcs.copy()

        _ = (
            pcs["PCs"]
            .isel(n_component=slice(0, num_pcs))
            .plot.line(
                x=self.pca_dim_for_rows,
                hue="n_component",
            )
        )

    def plot_eofs(
        self,
        vars_to_plot: List[str],
        num_eofs: int,
        destandarize: bool = False,
        map_center: tuple = None,
    ) -> None:
        """
        Plot the Empirical Orthogonal Functions (EOFs).

        Parameters
        ----------
        vars_to_plot : List[str]
            The variables to plot.
        num_eofs : int
            The number of EOFs to plot.
        destandarize : bool, optional
            If True, destandardize the EOFs. Default is False.
        map_center : tuple, optional
            The center of the map. Default is None.
            First value is the longitude (-180, 180), and the second value
            is the latitude (-90, 90).
        """

        if self.is_fitted is False:
            raise PCAError("PCA model must be fitted before plotting EOFs.")

        eofs = self._reshape_EOFs(destandarize=destandarize).isel(
            n_component=slice(0, num_eofs)
        )
        for var in vars_to_plot:
            if map_center:
                p_var = eofs[var].plot(
                    col="n_component",
                    col_wrap=3,
                    transform=ccrs.PlateCarree(),
                    subplot_kws={"projection": ccrs.Orthographic(*map_center)},
                )
                for i, ax in enumerate(p_var.axes.flat):
                    ax.coastlines()
                    ax.gridlines()
                    # ax.set_global()
                    # ax.stock_img()
                    ax.set_title(f"EOF {i + 1}")
            else:
                p_var = eofs[var].plot(
                    col="n_component",
                    col_wrap=3,
                )
                for i, ax in enumerate(p_var.axes.flat):
                    ax.set_title(f"EOF {i + 1}")
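

# Minimal end-to-end sketch (not part of the original module): mirrors the docstring
# example above using the bundled 2D sample dataset. It only runs when this file is
# executed directly.
if __name__ == "__main__":
    from bluemath_tk.core.data.sample_data import get_2d_dataset

    ds = get_2d_dataset()
    pca = PCA(n_components=5, is_incremental=False, debug=True)
    # Fit and transform in one call, keeping the PCs on the class
    pcs = pca.fit_transform(
        data=ds,
        vars_to_stack=["X", "Y"],
        coords_to_stack=["coord1", "coord2"],
        pca_dim_for_rows="coord3",
        windows_in_pca_dim_for_rows={"X": [1, 2, 3]},
        value_to_replace_nans={"X": 0.0},
        nan_threshold_to_drop={"X": 0.95},
    )
    # Reconstruct the fields from the PCs and report the retained variance
    reconstructed_ds = pca.inverse_transform(PCs=pcs)
    print(pca.cumulative_explained_variance_ratio)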