Source code for gemseo.post.opt_history_view

# Copyright 2021 IRT Saint Exupéry, https://www.irt-saintexupery.com
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License version 3 as published by the Free Software Foundation.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
# Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public License
# along with this program; if not, write to the Free Software Foundation,
# Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
# Contributors:
#    INITIAL AUTHORS - API and implementation and/or documentation
#        :author: Francois Gallard
#        :author: Damien Guenot
#        :author: Charlie Vanaret
#    OTHER AUTHORS   - MACROSCOPIC CHANGES
"""Plot the history of the design variables, objective and constraints."""

from __future__ import annotations

import logging
from typing import TYPE_CHECKING
from typing import ClassVar
from typing import Final

from matplotlib import pyplot as plt
from matplotlib.colors import SymLogNorm
from matplotlib.ticker import LogFormatterSciNotation
from matplotlib.ticker import MaxNLocator
from matplotlib.ticker import SymmetricalLogLocator
from numpy import abs as np_abs
from numpy import arange
from numpy import argmin
from numpy import array
from numpy import atleast_1d
from numpy import atleast_2d
from numpy import isnan
from numpy import max as np_max
from numpy import min as np_min
from numpy import vstack
from numpy.linalg import norm

from gemseo.core.mdo_functions.mdo_function import MDOFunction
from gemseo.post.base_post import BasePost
from gemseo.post.core.colormaps import PARULA
from gemseo.post.core.colormaps import RG_SEISMIC
from gemseo.post.opt_history_view_settings import OptHistoryView_Settings
from gemseo.utils.string_tools import repr_variable

if TYPE_CHECKING:
    from collections.abc import Iterable
    from collections.abc import MutableSequence
    from collections.abc import Sequence

    from matplotlib.colors import ListedColormap
    from matplotlib.figure import Figure
    from numpy import ndarray

    from gemseo.typing import NumberArray
    from gemseo.typing import RealArray

LOGGER = logging.getLogger(__name__)



[docs]
class OptHistoryView(BasePost[OptHistoryView_Settings]):
    """Plot the history of the design variables, objective and constraints.

    This post-processing generates one plot for the design variables, one plot for the
    Euclidean distance to the optimal design vector, one plot for the objective, one
    plot for the equality constraints (if any) and one plot for the inequality
    constraints (if any).
    """

    Settings: ClassVar[type[OptHistoryView_Settings]] = OptHistoryView_Settings

    x_label: ClassVar[str] = "Iterations"
    """The label for the x-axis."""

    __TICK_LABEL_SIZE: Final[int] = 9
    """The font size of the tick labels."""

    __AXIS_LABEL_SIZE: Final[int] = 12
    """The font size of the axis labels."""

    __X_MARGIN: Final[float] = 0.1
    """The left and right margin for the x-axis."""

    __Y_MARGIN: Final[float] = 0.05
    """The left and right margin for the y-axis."""

    __CMAP: Final[ListedColormap] = PARULA
    __INEQ_CSTR_CMAP: Final[ListedColormap] = RG_SEISMIC
    __EQ_CSTR_CMAP: Final[str] = "seismic"

    def _plot(self, settings: OptHistoryView_Settings) -> None:
        variable_names = settings.variable_names

        obj_history, x_history, n_iter, x_history_to_display = self._get_history(
            self._optimization_metadata.standardized_objective_name, variable_names
        )
        normalize = self._dataset.misc["input_space"].normalize_vect
        opt_design = self._dataset.design_dataset.loc[
            self._optimization_metadata.optimum_iteration or 1
        ].to_numpy()
        x_xstar = norm(normalize(x_history) - normalize(opt_design), axis=1)

        self._create_variables_plot(
            x_history_to_display, variable_names, settings.fig_size, x_xstar
        )

        self._create_obj_plot(
            atleast_1d(obj_history),
            n_iter,
            settings.fig_size,
            x_xstar,
            obj_min=settings.obj_min,
            obj_max=settings.obj_max,
            obj_relative=settings.obj_relative,
        )

        self._create_x_star_plot(x_history, n_iter, settings.fig_size)

        for constraints, constraint_type in [
            (
                self._dataset.inequality_constraint_names,
                MDOFunction.ConstraintType.INEQ,
            ),
            (
                self._dataset.equality_constraint_names,
                MDOFunction.ConstraintType.EQ,
            ),
        ]:
            if constraints:
                constraint_names = constraints
                self._create_cstr_plot(
                    self.__get_constraint_history(constraint_names),
                    constraint_type,
                    constraint_names,
                    settings.fig_size,
                    x_xstar,
                )

    def _get_history(
        self,
        function_name: str,
        variable_names: Iterable[str],
    ) -> tuple[RealArray, RealArray, int, RealArray]:
        """Access the optimization history of a function and the design variables.

        Args:
            function_name: The name of the function.
            variable_names: The names of the variables to display.
                If empty, use all design variables.

        Returns:
            The history of the function outputs,
            the history of the design variables,
            the number of iterations and
            the history of the design variables to display.
        """
        dataset = self._dataset
        f_hist = dataset.get_view(variable_names=function_name).to_numpy().squeeze()
        x_hist = dataset.design_dataset.to_numpy(dtype=float)
        f_hist = array(f_hist).real
        complete_x_hist = array(x_hist).real

        x_hist_to_display = complete_x_hist
        if variable_names:
            indices = [
                index
                for name in variable_names
                for index in self._dataset.misc["input_space"].names_to_indices[name]
            ]
            x_hist_to_display = complete_x_hist[:, indices]

        return f_hist, complete_x_hist, complete_x_hist.shape[0], x_hist_to_display

    def __get_constraint_history(
        self, constraint_names: MutableSequence[str]
    ) -> list[ndarray]:
        """Extract the history of constraints.

        Args:
            constraint_names: The names of the constraints.

        Returns:
            The history of the constraints.
        """
        available_data_names = self._dataset.variable_names
        for constraint_name in tuple(constraint_names):
            if constraint_name not in available_data_names:
                constraint_names.remove(constraint_name)

        constraints_history = []
        for constraint_name in constraint_names:
            constraint_history = (
                self._dataset.get_view(variable_names=constraint_name).to_numpy().real
            )
            constraints_history.append(constraint_history)

        return constraints_history

    def _create_variables_plot(
        self,
        x_history: RealArray,
        variable_names: Iterable[str],
        fig_size: tuple[float, float],
        x_xstar: RealArray,
    ) -> None:
        """Create the design variables plot.

        Args:
            x_history: The history for the design variables.
            variable_names: The names of the variables to display.
                If empty, use all design variables.
            x_xstar: The distance between the designs and the optimum design.
        """
        n_iterations = len(x_history)
        if n_iterations < 2:
            return

        design_space = self._dataset.misc["input_space"]
        lower_bounds = design_space.get_lower_bounds(variable_names)
        upper_bounds = design_space.get_upper_bounds(variable_names)
        norm_x_history = (x_history - lower_bounds) / (upper_bounds - lower_bounds)

        fig, ax1 = plt.subplots(1, 1, figsize=fig_size)

        # design variables
        im1 = ax1.imshow(
            norm_x_history.T,
            cmap=self.__CMAP,
            interpolation="nearest",
            vmin=0.0,
            vmax=1.0,
            aspect="auto",
        )
        ax1.axvline(x=argmin(x_xstar), color="r", label="Optimum")
        ax1.legend()
        ax1.set_yticks(arange(x_history.shape[1]))
        ax1.set_yticklabels(self._get_design_variable_names(variable_names, True))
        ax1.set_xlabel(self.x_label, fontsize=self.__AXIS_LABEL_SIZE)
        # ax1.invert_yaxis()

        ax1.set_title("Evolution of the optimization variables")
        ax1.set_xticks(range(n_iterations))
        ax1.set_xticklabels(map(str, (range(1, n_iterations + 1))))
        ax1.get_xaxis().set_major_locator(MaxNLocator(integer=True))

        # colorbar
        fig.colorbar(im1)

        # Set window size
        mng = plt.get_current_fig_manager()
        assert mng is not None
        mng.resize(700, 1000)

        self._add_figure(fig, "variables")

    def _create_obj_plot(
        self,
        obj_history: RealArray,
        n_iter: int,
        fig_size: tuple[float, float],
        x_xstar: RealArray,
        obj_min: float | None = None,
        obj_max: float | None = None,
        obj_relative: bool = False,
    ) -> None:
        """Creates the design variables plot.

        Args:
            obj_history: The history of the objective function.
            n_iter: The number of iterations.
            obj_max: The maximum value for the objective in the plot.
                If ``None``, use the maximum value of the objective history.
            obj_min: The minimum value for the objective in the plot.
                If ``None``, use the minimum value of the objective history.
            obj_relative: If ``True``, plot the objective value difference
                with the initial value.
            x_xstar: The distance between the designs and the optimum design.
        """
        if self._change_obj:
            obj_history = -obj_history

        if obj_relative:
            LOGGER.info(
                "Plot of optimization history "
                "with relative variation compared to "
                "initial point objective value = %s",
                obj_history[0],
            )
            obj_history -= obj_history[0]

        # Remove nans
        n_iterations = len(obj_history)
        x_absc = arange(n_iterations)
        idx_nan = isnan(obj_history)
        assert idx_nan is not None

        if idx_nan.size > 0:
            obj_history = obj_history[~idx_nan]
            x_absc_nan = x_absc[idx_nan]
            x_absc_not_nan = x_absc[~idx_nan]

        fmin = np_min(obj_history)
        fmax = np_max(obj_history)

        fig = plt.figure(figsize=fig_size)
        # objective function
        plt.xlabel(self.x_label, fontsize=self.__AXIS_LABEL_SIZE)
        plt.ylabel("Objective value", fontsize=self.__AXIS_LABEL_SIZE)
        plt.plot(x_absc_not_nan, obj_history)
        plt.axvline(x=argmin(x_xstar), color="r", label="Optimum")
        plt.legend()

        if idx_nan.size > 0:
            for x_i in x_absc_nan:
                plt.axvline(x_i, color="purple")

        if obj_min is not None and obj_min < fmin:
            fmin = obj_min
        if obj_max is not None and obj_max > fmax:
            fmax = obj_max

        margin = (fmax - fmin) * self.__Y_MARGIN
        plt.ylim([fmin - margin, fmax + margin])
        plt.xlim([0 - self.__X_MARGIN, n_iter - 1 + self.__X_MARGIN])
        ax1 = fig.gca()
        ax1.set_xticks(x_absc)
        ax1.set_xticklabels((x_absc + 1).tolist())
        ax1.get_xaxis().set_major_locator(MaxNLocator(integer=True))
        plt.grid(True)
        plt.title("Evolution of the objective value")

        # Set window size
        mng = plt.get_current_fig_manager()
        assert mng is not None
        mng.resize(700, 1000)

        self._add_figure(fig, "objective")

    def _create_x_star_plot(
        self,
        x_history: RealArray,
        n_iter: int,
        fig_size: tuple[float, float],
    ) -> None:
        """Create the design variables plot.

        Args:
            x_history: The history of the design variables.
            n_iter: The number of iterations.
        """
        fig = plt.figure(figsize=fig_size)
        plt.xlabel(self.x_label, fontsize=self.__AXIS_LABEL_SIZE)
        plt.ylabel("||x-x*||", fontsize=self.__AXIS_LABEL_SIZE)
        normalize = self._dataset.misc["input_space"].normalize_vect
        opt_design = self._dataset.design_dataset.loc[
            self._optimization_metadata.optimum_iteration or 1
        ].to_numpy(dtype=float)
        x_xstar = norm(
            normalize(x_history) - normalize(opt_design),
            axis=1,
        )

        # Draw a vertical line at the optimum
        n_iterations = len(x_history)
        plt.axvline(x=float(argmin(x_xstar)), color="r", label="Optimum")
        plt.legend()
        plt.semilogy(arange(n_iterations), x_xstar)
        plt.legend()
        # ======================================================================
        # try:
        #     plt.semilogy(np.arange(len(x_xstar)), x_xstar)
        # except ValueError:
        #     LOGGER.warning("Cannot use log scale for x_star plot since" +
        #                    "all values are not positive !")
        # ======================================================================
        ax1 = fig.gca()
        ax1.set_xticks(range(n_iterations))
        ax1.set_xticklabels(map(str, range(1, n_iterations + 1)))
        ax1.get_xaxis().set_major_locator(MaxNLocator(integer=True))
        plt.grid(True)
        plt.title("Evolution of the distance to the optimum")
        plt.xlim([0 - self.__X_MARGIN, n_iter - 1 + self.__X_MARGIN])

        # Set window size
        mng = plt.get_current_fig_manager()
        assert mng is not None
        mng.resize(700, 1000)

        self._add_figure(fig, "x_xstar")

    @staticmethod
    def _cstr_number(constraint_history: Iterable[RealArray]) -> int:
        """Compute the total scalar constraints number.

        Args:
            constraint_history: The history of the constraints.

        Returns:
            The number of constraints.
        """
        n_cstr = 0
        for constraint_history_i in constraint_history:
            c_hist_loc = atleast_2d(constraint_history_i).T
            if c_hist_loc.shape[1] == 1:
                c_hist_loc = c_hist_loc.T
            n_cstr += c_hist_loc.shape[0]
        LOGGER.debug("Total constraints number =%s", n_cstr)
        return n_cstr

    def _create_cstr_plot(
        self,
        cstr_history: Iterable[RealArray],
        cstr_type: MDOFunction.ConstraintType,
        cstr_names: Sequence[str],
        fig_size: tuple[float, float],
        x_xstar: RealArray,
    ) -> None:
        """Create the constraints plot: 1 line per constraint component.

        Args:
            cstr_history: The history of the constraints.
            cstr_type: The type of the constraints.
            cstr_names: The names of the constraints.
            x_xstar: The distance between the designs and the optimum design.
        """
        n_cstr = self._cstr_number(cstr_history)
        if n_cstr == 0:
            return

        # matrix of all constraints' values
        cstr_matrix = None
        vmax = 0.0
        cstr_labels = []

        max_iter = 0
        for cstr_history_i in cstr_history:
            history_i = atleast_2d(cstr_history_i).T
            if history_i.shape[1] == 1:
                history_i = history_i.T

            max_iter = max(max_iter, history_i.shape[1])

        for i, cstr_history_i in enumerate(cstr_history):
            history_i = atleast_2d(cstr_history_i).T
            if history_i.shape[1] == 1:
                history_i = history_i.T

            nb_components = history_i.shape[0]

            if history_i.shape[1] == max_iter:  # TEST
                for component_j in range(nb_components):
                    # compute the label of the constraint
                    if component_j == 0:
                        cstr_label = repr_variable(
                            cstr_names[i], component_j, nb_components
                        )
                    else:
                        cstr_label = repr_variable("", component_j)

                    cstr_labels.append(cstr_label)
                    history_i_j = atleast_2d(history_i[component_j, :])

                    # max value
                    notnans = ~isnan(history_i_j)
                    vmax = max(vmax, np_max(np_abs(history_i_j[notnans])))

                    # build the constraint matrix
                    if cstr_matrix is None:
                        cstr_matrix = history_i_j
                    else:
                        cstr_matrix = vstack((cstr_matrix, history_i_j))

        fig = self._build_cstr_fig(
            cstr_matrix, cstr_type, vmax, n_cstr, cstr_labels, fig_size, x_xstar
        )

        self._add_figure(fig, f"{cstr_type}_constraints")

    def _build_cstr_fig(
        self,
        cstr_matrix: NumberArray,
        cstr_type: MDOFunction.ConstraintType,
        vmax: float,
        n_cstr: int,
        cstr_labels: Sequence[str],
        fig_size: tuple[float, float],
        x_xstar: RealArray,
    ) -> Figure:
        """Build the constraints figure.

        Args:
            cstr_matrix: The matrix of constraints values.
            cstr_type: The type of the constraints.
            cstr_labels: The labels for the constraints.
            vmax: The maximum constraint absolute value.
            n_cstr: The number of constraints.
            cstr_labels: The labels of constraints names.
            x_xstar: The distance between the designs and the optimum design.

        Returns:
            The constraints figure.
        """
        if cstr_matrix.shape[0] == len(x_xstar):
            cstr_matrix = cstr_matrix.T
        cmap: str | ListedColormap
        if cstr_type == MDOFunction.ConstraintType.EQ:
            cmap = self.__EQ_CSTR_CMAP
            constraint_type = "equality"
        else:
            cmap = self.__INEQ_CSTR_CMAP
            constraint_type = "inequality"

        idx_nan = isnan(cstr_matrix)
        hasnan = idx_nan.any()
        if hasnan > 0:
            cstr_matrix[idx_nan] = 0.0

        # generation of the image
        fig, ax1 = plt.subplots(1, 1, figsize=fig_size)
        im1 = ax1.imshow(
            cstr_matrix,
            cmap=cmap,
            interpolation="nearest",
            aspect="auto",
            norm=SymLogNorm(vmin=-vmax, vmax=vmax, linthresh=1.0),
        )
        ax1.axvline(x=argmin(x_xstar), color="r", label="Optimum")
        if hasnan > 0:
            x_absc_nan = idx_nan.any(axis=0).nonzero()[0]
            for x_i in x_absc_nan:
                plt.axvline(x_i, color="purple")

        ax1.tick_params(labelsize=self.__TICK_LABEL_SIZE)
        ax1.set_yticks(list(range(n_cstr)))
        ax1.set_yticklabels(cstr_labels)

        ax1.set_xlabel(self.x_label, fontsize=self.__AXIS_LABEL_SIZE)
        ax1.set_title(f"Evolution of the {constraint_type} constraints")
        n_iterations = len(self._dataset)
        ax1.set_xticks(range(n_iterations))
        ax1.set_xticklabels(map(str, range(1, n_iterations + 1)))

        ax1.hlines(
            list(range(len(cstr_matrix))),
            [-0.5],
            [len(cstr_matrix[0]) - 0.5],
            alpha=0.1,
            lw=0.5,
        )
        ax1.get_xaxis().set_major_locator(MaxNLocator(integer=True))

        col_bar = fig.colorbar(
            im1,
            ticks=SymmetricalLogLocator(linthresh=1.0, base=10),
            format=LogFormatterSciNotation(),
        )
        col_bar.ax.tick_params(labelsize=self.__TICK_LABEL_SIZE)

        fig.tight_layout()
        mng = plt.get_current_fig_manager()
        # mng.full_screen_toggle()
        assert mng is not None
        mng.resize(700, 1000)
        return fig