Source code for customhys.hyperheuristic

"""
This module contains the Hyperheuristic class.

Created on Thu Jan  9 15:36:43 2020

@author: Jorge Mario Cruz-Duarte (jcrvz.github.io), e-mail: j.m.cruzduarte@ieee.org
"""

import json
import os
import random
from datetime import datetime
from os import makedirs as _create_path
from os.path import exists as _check_path

import numpy as np
import scipy.stats as st

from . import operators as op
from . import tools as jt
from .metaheuristic import Metaheuristic

# Flag telling the rest of the module whether the optional TensorFlow-based
# features could be imported. It stays False unless every import below succeeds.
_using_tensorflow = False
try:
    from os import environ as _environ

    import tensorflow as tf

    # This relative import is inside the same ``try``: an ImportError raised by
    # ``.machine_learning`` is reported exactly like a missing TensorFlow.
    from .machine_learning import DatasetSequences, ModelPredictor

    # Remove Tensorflow warnings
    # NOTE(review): the environment variable is set after ``import tensorflow``;
    # confirm that it still takes effect at this point.
    _environ["TF_CPP_MIN_LOG_LEVEL"] = "3"
    tf.get_logger().setLevel("ERROR")
    _using_tensorflow = True

except ImportError:
    import warnings as wa

    # Do not fail the import of this module: only emit a warning. The file name and
    # the line number (23) passed to ``showwarning`` are hard-coded literals.
    message = "`Tensorflow` not found! Please, install it to use the machine_learning module"
    wa.showwarning(message, ImportWarning, "hyperheuristic.py", 23)



[docs]
class Hyperheuristic:
    """
    This is the Hyperheuristic class, each object corresponds to a hyper-heuristic process implemented with a heuristic
    collection from Operators to build metaheuristics using the Metaheuristic module.
    """

    # Names accepted for the ``initial_scheme`` parameter. ``_select_initial_scheme``
    # validates the (lower-cased, stripped) user value against this set and draws one
    # of its members at random when the user asks for "auto".
    _VALID_INITIAL_SCHEMES = {
        "random",
        "vertex",
        "sobol",
        "halton",
        "beta",
        "normal",
        "lognormal",
        "exponential",
        "rayleigh",
        "weibull",
        "lhs",
    }


[docs]
    def __init__(self, heuristic_space="default.txt", problem=None, parameters=None, file_label="", weights_array=None):
        """
        Create a hyper-heuristic process using a operator collection as heuristic space.

        :param str heuristic_space: Optional.
            The heuristic space or search space collection. It could be a string indicating the file name, assuming it
            is located in the folder ``./collections/``, or a list with tuples (check the default collection
            ``./collections/default.txt'``) just like ``operators.build_operators`` generates. The default is
            'default.txt'.
        :param dict problem:
            This is a dictionary containing the 'function' that maps a 1-by-D array of real values to a real value,
            'is_constrained' flag that indicates the solution is inside the search space, and the 'boundaries' (a tuple
            with two lists of size D). These two lists correspond to the lower and upper limits of domain, such as:
            ``boundaries = (lower_boundaries, upper_boundaries)``

            **Note:** Dimensions (D) of search domain are read from these boundaries. The problem can be obtained from
            the ``benchmark_func`` module.
        :param dict parameters:
            Parameters to implement the hyper-heuristic procedure, the following fields must be provided: 'cardinality',
            'num_iterations', 'num_agents', 'num_replicas', 'num_steps', 'stagnation_percentage', 'max_temperature', and
            'cooling_rate'. The default is showing next:
                parameters = {cardinality=3,                # Max. numb. of SOs in MHs, lvl:1
                              num_iterations=100,           # Iterations a MH performs, lvl:1
                              num_agents=30,                # Agents in population,     lvl:1
                              num_replicas=50,              # Replicas per each MH,     lvl:2
                              num_steps=100,                # Trials per HH step,       lvl:2
                              stagnation_percentage=0.3,    # Stagnation percentage,    lvl:2
                              max_temperature=200,          # Initial temperature (SA), lvl:2
                              cooling_rate=0.05}            # Cooling rate (SA),        lvl:2

            **Note:** Level (lvl) flag corresponds to the heuristic level of the parameter. lvl:1 concerns to mid-level
            heuristics like metaheuristics, and lvl:2 to high-level heuristics like hyper-heuristics.
        :param str file_label: Optional.
            Tag or label for saving files. The default is ''.
        :param numpy.array weights_array: Optional.
            Weights of the search operators, if there is a-priori information about them. The default is None.
        """
        # Read the heuristic space
        if isinstance(heuristic_space, list):
            self.heuristic_space_label = "custom_list"
            self.heuristic_space = heuristic_space
        elif isinstance(heuristic_space, str):
            self.heuristic_space_label = heuristic_space[: heuristic_space.rfind(".")].split("_")[0]
            with open(os.path.join("collections", heuristic_space), encoding="utf-8") as operators_file:
                self.heuristic_space = [eval(line.rstrip("\n")) for line in operators_file]
        else:
            raise HyperheuristicError("Invalid heuristic_space")

        # Assign default values
        # TODO: Put default values -> .get('key', defaultVal)
        if not parameters:
            parameters = {
                "cardinality": 3,  # Max. numb. of SOs in MHs, lvl:1
                "cardinality_min": 1,  # Min. numb. of SOs in MHs, lvl:1
                "num_iterations": 100,  # Iterations a MH performs, lvl:1
                "num_agents": 30,  # Agents in population,     lvl:1
                "as_mh": False,  # HH sequence as a MH?,     lvl:2
                "num_replicas": 50,  # Replicas per each MH,     lvl:2
                "num_steps": 200,  # Trials per HH step,       lvl:2
                "stagnation_percentage": 0.37,  # Stagnation percentage,    lvl:2
                "max_temperature": 1,  # Initial temperature (SA), lvl:2
                "min_temperature": 1e-6,  # Min temperature (SA),     lvl:2
                "cooling_rate": 1e-3,  # Cooling rate (SA),        lvl:2
                "temperature_scheme": "fast",  # Temperature updating (SA),lvl:2
                "acceptance_scheme": "exponential",  # Acceptance mode,          lvl:2
                "allow_weight_matrix": True,  # Weight matrix,            lvl:2
                "trial_overflow": False,  # Trial overflow policy,    lvl:2
                "learnt_dataset": None,  # If it is a learnt dataset related with the heuristic space
                "repeat_operators": True,  # Allow repeating SOs inSeq,lvl:2
                "verbose": True,  # Verbose process,          lvl:2
                "learning_portion": 0.37,  # Percent of seqs to learn  lvl:2
                "solver": "static",  # Indicate which solver use lvl:1
            }

        # Read the problem
        if problem:
            self.problem = problem
        else:
            raise HyperheuristicError("Problem must be provided")

        # Read the heuristic space size and create the active set
        self.num_operators = len(self.heuristic_space)
        self.current_space = np.arange(self.num_operators)

        # Read the weights (if it is entered)
        self.weights = weights_array
        self.weight_matrix = None
        self.transition_matrix = None

        # Initialise other parameters
        self.parameters = parameters
        self.file_label = file_label
        raw_initial_scheme = parameters.get("initial_scheme", parameters.get("intial_scheme", "random"))
        self.initial_scheme = self._select_initial_scheme(raw_initial_scheme)
        self.parameters["initial_scheme"] = self.initial_scheme

        self.max_cardinality = None
        self.min_cardinality = None
        self.num_iterations = None
        self.toggle_seq_as_meta(parameters["as_mh"])


    def _select_initial_scheme(self, initial_scheme):
        scheme = "random" if initial_scheme is None else str(initial_scheme).strip().lower()
        if scheme == "auto":
            scheme = random.choice(tuple(self._VALID_INITIAL_SCHEMES))

        if scheme not in self._VALID_INITIAL_SCHEMES:
            valid = ", ".join(sorted(self._VALID_INITIAL_SCHEMES))
            raise HyperheuristicError(f"Invalid initial_scheme '{initial_scheme}'. Valid values: {valid}")

        return scheme

    @property
    def initialization_operators(self):
        """Return a list of (index, op_tuple) for operators with role='initialize' in the heuristic space."""
        return [
            (i, op_tuple) for i, op_tuple in enumerate(self.heuristic_space) if op._get_role(op_tuple) == "initialize"
        ]


[docs]
    def toggle_seq_as_meta(self, as_mh=None):
        if as_mh is None:
            self.parameters["as_mh"] = not self.parameters["as_mh"]
            self.toggle_seq_as_meta(self.parameters["as_mh"])
        else:
            if as_mh:
                self.max_cardinality = self.parameters["cardinality"]
                self.min_cardinality = self.parameters["cardinality_min"]
                self.num_iterations = self.parameters["num_iterations"]
            else:
                self.max_cardinality = self.parameters["num_iterations"]
                self.min_cardinality = self.parameters["cardinality_min"]
                self.num_iterations = 1


    def _choose_action(self, current_cardinality, previous_action=None, available_options=None):
        # First read the available actions. Those can be ...
        if available_options is None:
            available_options = [
                "Add",
                "AddMany",
                "Remove",
                "RemoveMany",
                "Shift",
                "LocalShift",
                "Swap",
                "Restart",
                "Mirror",
                "Roll",
                "RollMany",
            ]
            # Allow changing the init operator when the space has at least 2 init operators
            if len(self.initialization_operators) >= 2:
                available_options.append("ChangeInitOperator")

        # Black list (to avoid repeating the some actions in a row)
        if previous_action:
            if (previous_action == "Mirror") and ("Mirror" in available_options):
                available_options.remove("Mirror")

        # Disregard those with respect to the current cardinality. It also considers the case of fixed cardinality
        if current_cardinality <= self.min_cardinality + 1:
            if "RemoveMany" in available_options:
                available_options.remove("RemoveMany")

            if (current_cardinality <= self.min_cardinality) and ("Remove" in available_options):
                available_options.remove("Remove")

        if current_cardinality <= 1:
            if "Swap" in available_options:
                available_options.remove("Swap")
            if "Mirror" in available_options:
                available_options.remove("Mirror")  # not an error, but to prevent wasting time

        if current_cardinality >= self.max_cardinality - 1:
            if "AddMany" in available_options:
                available_options.remove("AddMany")

            if (current_cardinality >= self.max_cardinality) and ("Add" in available_options):
                available_options.remove("Add")

        # Decide (randomly) which action to do
        return np.random.choice(available_options)

    @staticmethod
    def __get_argfrequencies(weights, top=5):
        return np.argsort(weights)[-top:]

    @staticmethod
    def __adjust_frequencies(weights, to_only=5):
        """
        This method adjust a ``weights`` vector to only having only the top ``to_only`` most relevant search operators. It
        is made based on the greatest frequency values.
        @param weights: np.ndarray.
            The weight vector to adjust.
        @param to_only: int. Optional.
            The number of the most relevant search operators to be considered in the adjustment.
        @return: np.ndarray.
            An array with the same properties of ``weights``.
        """
        new_weights = np.zeros(weights.shape)
        new_weights[np.argsort(weights)[-to_only:]] = 1 / to_only
        return new_weights

    def _obtain_candidate_solution(self, sol=None, action=None, operators_weights=None, top=None):
        """
        This method selects a new candidate solution for a given candidate solution ``sol``. To do so, it
        adds, deletes, or perturbate a randomly chosen operator index from the current sequence. If this sequence
        is None, the method returns a new 1-cardinality sequence at random.
        :param list|int sol: Optional.
            Sequence of heuristic indices (or encoded solution). If `sol` is an integer, it is assumed that this is
            the cardinality required for initial random sequence. The default is None, which means that there is no
            current sequence, so an initial one is required.
        :return: list.
        """
        # Create a new MH with min_cardinality from scratch by using a weights array (if so)
        # if action is given, it is assumed the way of obtaining this intial solution
        init_indices = [i for i, _ in self.initialization_operators]
        has_init_ops = len(init_indices) > 0

        if sol is None:
            if action == "max_frequency":
                # Each search operator per step corresponds to the most frequent one: uMH weight matrix is required
                # this option only works for transfer learning
                encoded_neighbour = [weights_per_step.argmax() for weights_per_step in operators_weights]

            else:
                initial_cardinality = (
                    self.min_cardinality
                    if self.parameters["as_mh"]
                    else (self.max_cardinality + self.min_cardinality) // 2
                )

                # When init operators exist, index 0 is reserved for one of them.
                # Keep at least one operator in the tail so a perturbation sequence can run.
                if has_init_ops:
                    initial_cardinality = max(initial_cardinality, 2)

                operators_weights = operators_weights if operators_weights else self.weights

                tail_size = initial_cardinality - 1 if has_init_ops else initial_cardinality
                encoded_neighbour = np.random.choice(
                    self.current_space if (operators_weights is None) else self.num_operators,
                    tail_size,
                    replace=self.parameters["repeat_operators"],
                    p=operators_weights,
                )

                if has_init_ops:
                    encoded_neighbour = np.concatenate(
                        ([np.random.choice(init_indices)], np.asarray(encoded_neighbour))
                    )

        # If sol is an integer, assume that it refers to the cardinality
        elif isinstance(sol, int):
            operators_weights = self.weights if operators_weights is None else operators_weights

            cardinality = max(sol, 2) if has_init_ops else sol
            tail_size = cardinality - 1 if has_init_ops else cardinality
            encoded_neighbour = np.random.choice(
                self.current_space if (operators_weights is None) else self.num_operators,
                tail_size,
                replace=self.parameters["repeat_operators"],
                p=operators_weights,
            )

            if has_init_ops:
                encoded_neighbour = np.concatenate(([np.random.choice(init_indices)], np.asarray(encoded_neighbour)))

        elif isinstance(sol, np.ndarray | list):
            # Bypass the current weights vector to highlight the ``top`` most relevant ones.
            if (operators_weights is not None) and (top is not None):
                operators_weights = self.__adjust_frequencies(operators_weights, to_only=top)

            sol = np.array(sol) if isinstance(sol, list) else sol
            current_cardinality = len(sol)

            # Choose (randomly) which action to do
            if not action:
                action = self._choose_action(current_cardinality)

            # Perform the corresponding action
            if (action == "Add") and (current_cardinality < self.max_cardinality):
                # Select an operator excluding the ones in the current solution
                selected_operator = np.random.choice(
                    np.setdiff1d(self.current_space, sol)
                    if not self.parameters["repeat_operators"]
                    else self.current_space
                )

                # Select where to add such an operator, since ``operator_location`` value represents:
                #       0 - left side of the first operator
                #       1 - right side of the first operator or left side of the second one,
                #       ..., and so forth.
                #
                #       | operator 1 | operator 2 | operator 3 |     ...      |  operator N  |
                #       0 <--------> 1 <--------> 2 <--------> 3 <-- ... --> N-1 <---------> N
                min_insert = 1 if has_init_ops else 0
                operator_location = np.random.randint(min_insert, current_cardinality + 1)

                # Add the selected operator
                encoded_neighbour = np.array((*sol[:operator_location], selected_operator, *sol[operator_location:]))

            elif (action == "AddMany") and (current_cardinality < self.max_cardinality - 1):
                encoded_neighbour = np.copy(sol)
                for _ in range(np.random.randint(1, self.max_cardinality - current_cardinality + 1)):
                    encoded_neighbour = self._obtain_candidate_solution(sol=encoded_neighbour, action="Add")

            elif action == "Remove":
                min_card = max(self.min_cardinality, 2) if has_init_ops else self.min_cardinality
                if current_cardinality > min_card:
                    remove_idx = (
                        np.random.randint(1, current_cardinality)
                        if has_init_ops
                        else np.random.randint(current_cardinality)
                    )
                    encoded_neighbour = np.delete(sol, remove_idx)
                else:
                    encoded_neighbour = np.copy(sol)

            elif action == "RemoveLast":
                min_card = max(self.min_cardinality, 2) if has_init_ops else self.min_cardinality
                if current_cardinality > min_card:
                    encoded_neighbour = np.delete(sol, -1)
                else:
                    encoded_neighbour = np.copy(sol)

            elif action == "RemoveMany":
                min_card = max(self.min_cardinality, 2) if has_init_ops else self.min_cardinality
                if current_cardinality > min_card + 1:
                    encoded_neighbour = np.copy(sol)
                    for _ in range(np.random.randint(1, current_cardinality - min_card + 1)):
                        encoded_neighbour = self._obtain_candidate_solution(sol=encoded_neighbour, action="Remove")
                else:
                    encoded_neighbour = np.copy(sol)

            elif action == "Shift":
                # Perturbate an operator randomly selected excluding the existing ones
                encoded_neighbour = np.copy(sol)
                shift_idx = (
                    np.random.randint(1, current_cardinality)
                    if has_init_ops
                    else np.random.randint(current_cardinality)
                )
                encoded_neighbour[shift_idx] = np.random.choice(
                    np.setdiff1d(self.current_space, sol)
                    if not self.parameters["repeat_operators"]
                    else self.num_operators
                )

            elif action == "ShiftMany":
                encoded_neighbour = np.copy(sol)
                for _ in range(np.random.randint(1, current_cardinality - self.min_cardinality + 1)):
                    encoded_neighbour = self._obtain_candidate_solution(sol=encoded_neighbour, action="Shift")

            elif action == "LocalShift":  # It only works with the full set
                # Perturbate an operator randomly selected +/- 1 excluding the existing ones
                encoded_neighbour = np.copy(sol)
                operator_location = (
                    np.random.randint(1, current_cardinality)
                    if has_init_ops
                    else np.random.randint(current_cardinality)
                )
                neighbour_direction = 1 if random.random() < 0.5 else -1  # +/- 1
                selected_operator = (encoded_neighbour[operator_location] + neighbour_direction) % self.num_operators

                # If repeat is true and the selected_operator is repeated, then apply +/- 1 until it is not repeated
                while (not self.parameters["repeat_operators"]) and (selected_operator in encoded_neighbour):
                    selected_operator = (selected_operator + neighbour_direction) % self.num_operators

                encoded_neighbour[operator_location] = selected_operator

            elif action == "LocalShiftMany":
                encoded_neighbour = np.copy(sol)
                for _ in range(np.random.randint(1, current_cardinality - self.min_cardinality + 1)):
                    encoded_neighbour = self._obtain_candidate_solution(sol=encoded_neighbour, action="LocalShift")

            elif (action == "Swap") and (current_cardinality > 1):
                # Swap two elements randomly chosen
                start_idx = 1 if has_init_ops else 0
                tail_len = current_cardinality - start_idx

                if tail_len <= 1:
                    encoded_neighbour = np.copy(sol)

                elif tail_len == 2:
                    encoded_neighbour = np.copy(sol)
                    encoded_neighbour[start_idx:] = encoded_neighbour[start_idx:][::-1]

                elif tail_len > 2:
                    encoded_neighbour = np.copy(sol)
                    ind1, ind2 = np.random.choice(np.arange(start_idx, current_cardinality), 2, replace=False)
                    encoded_neighbour[ind1], encoded_neighbour[ind2] = encoded_neighbour[ind2], encoded_neighbour[ind1]

                elif current_cardinality == 2:
                    encoded_neighbour = np.copy(sol)[::-1]

                elif current_cardinality > 2:
                    encoded_neighbour = np.copy(sol)
                    ind1, ind2 = np.random.choice(current_cardinality, 2, replace=False)
                    encoded_neighbour[ind1], encoded_neighbour[ind2] = encoded_neighbour[ind2], encoded_neighbour[ind1]

                else:
                    raise HyperheuristicError("Swap cannot be applied! current_cardinality < 2")

            elif action == "Mirror":
                # Mirror the sequence of the encoded_neighbour
                encoded_neighbour = np.copy(sol)
                if has_init_ops:
                    encoded_neighbour[1:] = encoded_neighbour[1:][::-1]
                else:
                    encoded_neighbour = encoded_neighbour[::-1]

            elif action == "Roll":
                # Move a step forward or backward, depending on a random variable, all the sequence
                encoded_neighbour = np.copy(sol)
                roll_step = 1 if random.random() < 0.5 else -1
                if has_init_ops:
                    encoded_neighbour[1:] = np.roll(encoded_neighbour[1:], roll_step)
                else:
                    encoded_neighbour = np.roll(encoded_neighbour, roll_step)

            elif action == "RollMany":
                # Move many (at random) steps forward or backward, depending on a random variable, all the sequence
                encoded_neighbour = np.copy(sol)
                roll_step = np.random.randint(current_cardinality) * (1 if random.random() < 0.5 else -1)
                if has_init_ops:
                    encoded_neighbour[1:] = np.roll(encoded_neighbour[1:], roll_step)
                else:
                    encoded_neighbour = np.roll(encoded_neighbour, roll_step)

            elif action == "Restart":
                # Restart the entire sequence
                encoded_neighbour = self._obtain_candidate_solution(current_cardinality)

            elif action == "ChangeInitOperator":
                # Swap the initialization operator at position 0 for another one
                init_candidates = [i for i in init_indices if i != sol[0]] if sol[0] in init_indices else init_indices
                encoded_neighbour = np.copy(sol)
                if init_candidates:
                    encoded_neighbour[0] = np.random.choice(init_candidates)

            else:
                raise HyperheuristicError(f"Invalid action = {action} to perform!")
        else:
            raise HyperheuristicError("Invalid type of current solution!")

        # Return the neighbour sequence
        return encoded_neighbour

    def _obtain_temperature(self, step_val, function="boltzmann"):
        """
        Return the updated temperature according to a defined scheme ``function``.
        :param int step_val:
            Step (or iteration) value of the current state of the hyper-heuristic search.
        :param str function: Optional.
            Mechanism for updating the temperature. It can be 'exponential', 'fast', or 'boltzmann'. The default
            is 'boltzmann'.
        :return: float
        """
        if function == "fast":
            return self.parameters["max_temperature"] / step_val

        elif function == "linear":
            return self.parameters["max_temperature"] - (1 - self.parameters["cooling_rate"]) * step_val

        elif function == "quadratic":
            return self.parameters["max_temperature"] / (1 + (1 - self.parameters["cooling_rate"]) * (step_val**2))

        elif function == "logarithmic":
            return self.parameters["max_temperature"] / (
                1 + (1 - self.parameters["cooling_rate"]) * np.log(step_val + 1)
            )

        elif function == "exponential":
            return self.parameters["max_temperature"] * np.power(1 - self.parameters["cooling_rate"], step_val)

        elif function == "boltzmann":
            return self.parameters["max_temperature"] / np.log(step_val + 1)

        else:
            raise HyperheuristicError("Invalid temperature scheme")

    def _check_acceptance(self, delta, acceptation_scheme="greedy", temp=1.0, energy_zero=1.0, prob=None):
        """
        Return a flag indicating if the current performance value can be accepted according to ``acceptation_scheme``.
        :param float delta:
            Energy change for determining the acceptance probability.
        :param str acceptation_scheme: Optional.
            Function for determining the acceptance probability. It can be 'exponential', 'boltzmann', 'probabilistic',
            or 'greedy'. The default is 'greedy'. For 'probabilistic' and 'greedy', temp and energy parameters are not
            used.
        :param float temp: Required for acceptation_scheme = ('exponential'|'boltzmann')
            Temperature value for determining the acceptance probability. The default value is 1.
        :param float energy_zero: Required for acceptation_scheme = ('exponential'|'boltzmann')
            Energy value to scale the temperature measurement. The default value is 1.
        :return: bool
        """

        if acceptation_scheme == "exponential":
            probability = np.min([np.exp(-delta / (energy_zero * temp)), 1]) if prob is None else prob
            if self.parameters["verbose"]:
                print(
                    f", [Delta: {delta:.2e}, ArgProb: {-delta / (energy_zero * temp):.2e}, Prob: {probability:.2f}]",
                    end=" ",
                )
            return np.random.rand() < probability
        elif acceptation_scheme == "boltzmann":
            probability = 1.0 / (1.0 + np.exp(delta / temp)) if prob is None else prob
            return (delta <= 0.0) or (np.random.rand() <= probability)
        elif acceptation_scheme == "probabilistic":
            probability = 0.25 if prob is None else prob
            return (delta < 0.0) or (np.random.rand() <= probability)
        else:  # Greedy
            return delta <= 0.0

    def __stagnation_check(self, stag_counter):
        return stag_counter > (self.parameters["stagnation_percentage"] * self.parameters["num_steps"])

    def _check_finalisation(self, step, stag_counter, *args):
        """
        General finalisation approach implemented for the methodology working as a hyper-heuristic. It mainly depends on
        `step` (current iteration number) and `stag_counter` (current stagnation iteration number). There are other
         variables that can be considered such as `temperature`. These additional variables must be args[0] < 0.0.
        """
        return (
            (step >= self.parameters["num_steps"])
            or (self.__stagnation_check(stag_counter) and not self.parameters["trial_overflow"])
            or (any(var < 0.0 for var in args))
        )


[docs]
    def get_operators(self, sequence):
        return [self.heuristic_space[index] for index in sequence]



[docs]
    def solve(self, mode=None, save_steps=True):
        mode = mode if mode is not None else self.parameters["solver"]

        if mode == "dynamic":
            return self._solve_dynamic(save_steps, initial_scheme=self.initial_scheme)
        elif mode == "neural_network":
            return self._solve_neural_network(save_steps)
        else:  # default: 'static'
            return self._solve_static(save_steps, initial_scheme=self.initial_scheme)


    def _solve_static(self, save_steps=True, initial_scheme="random"):
        """
        Run the hyper-heuristic based on Simulated Annealing (SA) to find the best metaheuristic. Each metaheuristic is
        run 'num_replicas' times to obtain statistics and then its performance. Once the process ends, it returns:
            - solution: The sequence of search operators that compose the metaheuristic.
            - performance: The metric value defined in ``get_performance``.
            - encoded_solution: The sequence of indices that correspond to the search operators.
            - historicals: A dictionary of information from each step. Its keys are: 'step', 'encoded_solution',
            'solution', 'performances', and 'details'. The latter, 'details', is also a dictionary which contains
            information about each replica carried out with the metaheuristic. Its fields are 'historical' (each
            iteration that the metaheuristic has performed), 'fitness', 'positions', and 'statistics'.
        :returns: solution (list), performance (float), encoded_solution (list)
        """

        # %% INITIALISER PART

        # PERTURBATOR (GENERATOR): Create the initial solution
        current_solution = self._obtain_candidate_solution()

        # Evaluate this solution
        current_performance, current_details = self.evaluate_candidate_solution(
            current_solution, initial_scheme=initial_scheme
        )

        # Initialise some additional variables
        initial_energy = np.abs(current_performance) + 1
        historical_current = [current_performance]
        historical_best = [current_performance]

        # SELECTOR: Initialise the best solution and its performance
        best_solution = np.copy(current_solution)
        best_performance = current_performance

        # Save this historical register, step = 0
        if save_steps:
            _save_step(
                0,
                {"encoded_solution": best_solution, "performance": best_performance, "details": current_details},
                self.file_label,
            )

        # Step, stagnation counter and its maximum value
        step = 0
        stag_counter = 0
        action = None
        temperature = self.parameters["max_temperature"]

        # Print the first status update, step = 0
        if self.parameters["verbose"]:
            print(
                "{} :: Step: {:4d}, Action: {:12s}, Temp: {:.2e}, Card: {:3d}, Perf: {:.2e} [Initial]".format(
                    self.file_label, step, "None", temperature, len(current_solution), current_performance
                )
            )

        # Perform a metaheuristic (now, Simulated Annealing) as hyper-heuristic process
        while not self._check_finalisation(step, stag_counter, temperature - self.parameters["min_temperature"]):
            # Update step and temperature
            step += 1
            temperature = self._obtain_temperature(step, self.parameters["temperature_scheme"])

            # Generate a neighbour solution (just indices-codes)
            action = self._choose_action(len(current_solution), action)
            candidate_solution = self._obtain_candidate_solution(sol=current_solution, action=action)

            # Evaluate this candidate solution
            candidate_performance, candidate_details = self.evaluate_candidate_solution(
                candidate_solution, initial_scheme=initial_scheme
            )

            # Print update
            if self.parameters["verbose"]:
                print(
                    f"{self.file_label} :: Step: {step:4d}, Action: {action:12s}, Temp: {temperature:.2e}, Card: {len(candidate_solution):3d}, "
                    + f"candPerf: {candidate_performance:.2e}, currPerf: {current_performance:.2e}, bestPerf: {best_performance:.2e}",
                    end=" ",
                )

            # Accept the current solution using a given acceptance_scheme
            if self._check_acceptance(
                candidate_performance - current_performance,
                self.parameters["acceptance_scheme"],
                temperature,
                initial_energy,
            ):

                # Update the current solution and its performance
                current_solution = np.copy(candidate_solution)
                current_performance = candidate_performance

                # Add acceptance mark
                if self.parameters["verbose"]:
                    print("A", end="")

            # If the candidate solution is better or equal than the current best solution
            if candidate_performance <= best_performance:

                # Update the best solution and its performance
                best_solution = np.copy(candidate_solution)
                best_performance = candidate_performance

                # Reset the stagnation counter
                stag_counter = 0

                # Save this information
                if save_steps:
                    _save_step(
                        step,
                        {
                            "encoded_solution": best_solution,
                            "performance": best_performance,
                            "details": candidate_details,
                        },
                        self.file_label,
                    )

                # Add improvement mark
                if self.parameters["verbose"]:
                    print("+", end="")
            else:
                # Update the stagnation counter
                stag_counter += 1

            historical_current.append(current_performance)
            historical_best.append(best_performance)
            # Add ending mark
            if self.parameters["verbose"]:
                print("")

        # Print the best one
        if self.parameters["verbose"]:
            print(f"\nBEST --> Perf: {best_performance}, e-Sol: {best_solution}")

        # Return the best solution found and its details
        return best_solution, best_performance, historical_current, historical_best

    def _solve_dynamic(self, save_steps=True, initial_scheme="random"):
        """
        Run the dynamic hyper-heuristic: for each replica, build a sequence of search operators one step at a time.

        For each of the ``parameters['num_replicas']`` replicas a new ``Metaheuristic`` is created and initialised.
        Then, while ``_check_finalisation`` does not stop the process, a search operator is drawn with
        ``_obtain_candidate_solution`` using the current operator probabilities and applied to the population. The
        operator is appended to the sequence when ``_check_acceptance`` (scheme 'probabilistic', ``prob=0.2``)
        accepts the change of the global best fitness; otherwise, the population is reverted and the stagnation
        counter increases. After each replica, ``_update_weights`` is called with all the sequences found so far.

        :param bool save_steps: Optional.
            Whether to store the information of each replica via ``_save_step``. The default is True.
        :param initial_scheme: Optional.
            Initialisation scheme forwarded to ``Metaheuristic``. The default is 'random'.
        :returns: fitness_per_repetition (list), sequence_per_repetition (list), transition_matrix
            - fitness_per_repetition: For each replica, the global best fitness after the initialiser and after each
            accepted search operator.
            - sequence_per_repetition: For each replica, the indices of the accepted search operators. Each sequence
            starts with -1, which stands for the initialiser.
            - transition_matrix: The value of ``self.transition_matrix`` when the process ends.
        """
        sequence_per_repetition = []
        fitness_per_repetition = []

        for rep in range(self.parameters["num_replicas"]):
            # Call the metaheuristic
            mh = Metaheuristic(
                self.problem,
                num_agents=self.parameters["num_agents"],
                num_iterations=self.num_iterations,
                initial_scheme=initial_scheme,
            )

            # %% INITIALISER PART
            mh.apply_initialiser()

            # Extract the best fitness and position found by the initialiser
            current_fitness = np.copy(mh.pop.global_best_fitness)
            current_position = np.copy(mh.pop.rescale_back(mh.pop.global_best_position))

            # Heuristic sets
            self.current_space = np.arange(self.num_operators)

            # The sequence starts with -1, which stands for the initialiser
            current_sequence = [-1]

            best_fitness = [current_fitness]
            best_position = [current_position]
            # Population snapshots per accepted step (collected here, not consumed within this method)
            fitness_data = [np.copy(mh.pop.fitness)]
            positions_data = [np.copy(mh.pop.get_positions())]

            step = 0
            stag_counter = 0

            # We assume that with only one operator, it never reaches the solution. So, we check finalisation ending itr

            # FINALISATOR: Finalise due to other concepts
            while not self._check_finalisation(step, stag_counter):
                # Choose the probabilities used to pick the next search operator
                if self.parameters["trial_overflow"] and self.__stagnation_check(stag_counter):
                    # Too many failed trials: fall back to a uniform choice
                    possible_transitions = np.ones(self.num_operators) / self.num_operators
                    which_matrix = "random"
                elif (self.parameters["allow_weight_matrix"] is not None) and (self.transition_matrix is not None):
                    if step < self.transition_matrix.shape[0]:
                        possible_transitions = self.transition_matrix[step]
                        transitions_sum = possible_transitions.sum()

                        if transitions_sum > 0.0:
                            possible_transitions = np.nan_to_num(possible_transitions / transitions_sum)
                        else:
                            possible_transitions = np.ones(self.num_operators) / self.num_operators

                        which_matrix = "transition"
                    else:
                        # No learnt row exists for this step yet, so use a uniform choice. The label is set here
                        # too; otherwise the log below would show a stale value (or fail if it was never assigned).
                        possible_transitions = np.ones(self.num_operators) / self.num_operators
                        which_matrix = "random"
                else:
                    if self.weight_matrix is not None:
                        self.weights = self.weight_matrix[step]
                    possible_transitions = self.weights

                    which_matrix = "entered"

                # Pick randomly a simple heuristic
                candidate_enc_so = self._obtain_candidate_solution(sol=1, operators_weights=possible_transitions)

                # Prepare before evaluate the last search operator and apply it
                candidate_search_operator = self.get_operators([candidate_enc_so[-1]])
                mh.apply_search_operator(candidate_search_operator[0], candidate_search_operator[0][2])

                # Extract the best fitness and position after applying the candidate operator
                current_fitness = np.copy(mh.pop.global_best_fitness)
                current_position = np.copy(mh.pop.rescale_back(mh.pop.global_best_position))

                # Print update
                if self.parameters["verbose"]:
                    print(
                        "{} :: Rep: {:3d}, Step: {:3d}, Trial: {:3d}, SO: {:30s}, currPerf: {:.2e}, candPerf: {:.2e} "
                        "which: {:10s}".format(
                            self.file_label,
                            rep + 1,
                            step + 1,
                            stag_counter,
                            candidate_search_operator[0][0] + " & " + candidate_search_operator[0][2][:4],
                            best_fitness[-1],
                            current_fitness,
                            which_matrix,
                        ),
                        end=" ",
                    )

                # Keep the operator if the fitness change is accepted by the probabilistic scheme
                if self._check_acceptance(current_fitness - best_fitness[-1], "probabilistic", prob=0.2):

                    # Update the current sequence and its characteristics
                    current_sequence.append(candidate_enc_so[-1])

                    best_fitness.append(current_fitness)
                    best_position.append(current_position)
                    fitness_data.append(np.copy(mh.pop.fitness))
                    positions_data.append(np.copy(mh.pop.get_positions()))

                    # Update counters
                    step += 1
                    stag_counter = 0
                    self._trial_overflow = False

                    # Add improvement mark
                    if self.parameters["verbose"]:
                        print("+", end="")

                else:  # Then try another search operator

                    # Revert the modification to the population in the mh object
                    mh.pop.revert_positions()

                    # Update stagnation
                    stag_counter += 1

                # Add ending mark
                if self.parameters["verbose"]:
                    print("")

            # Print the values obtained with the last operator tried in this replica
            if self.parameters["verbose"]:
                print(f"\nBest fitness: {current_fitness},\nBest position: {current_position}")

            #  Update the repetition register
            sequence_per_repetition.append(np.double(current_sequence).astype(int).tolist())
            fitness_per_repetition.append(np.double(best_fitness).tolist())

            # Update the weights for learning purposes
            self._update_weights(sequence_per_repetition)

            # Save this historical register
            if save_steps:
                _save_step(
                    rep + 1,
                    {
                        "encoded_solution": np.array(current_sequence),
                        "best_fitness": np.double(best_fitness),
                        "best_positions": np.double(best_position),
                        "details": {
                            "fitness_per_rep": fitness_per_repetition,
                            "sequence_per_rep": sequence_per_repetition,
                            "weight_matrix": self.weight_matrix,
                        },
                    },
                    self.file_label,
                )

        # Return the fitness values and sequences of all replicas, and the learnt transition matrix
        return fitness_per_repetition, sequence_per_repetition, self.transition_matrix

    def _solve_neural_network(self, save_steps=True):
        """
        Run the hyper-heuristic based on a Neural Network (NN) to find the best metaheuristic.

        Given the current sequence of simple heuristics, the NN model predicts which should be the following search
        operator. The model is obtained from ``_get_neural_network_predictor``, which loads or trains it. A single
        model is used to generate one unfolded metaheuristic (uMH) per replica (``parameters['num_replicas']``) for
        the given problem. Once the process ends, it returns:
            - fitness_per_repetition: The list of fitnesses of all uMH generated by the model.
            - sequence_per_repetition: The list of uMHs generated by the model.
        This method requires a special dictionary in the ``hh_config`` with the following parameters (keys that are
        not read in this class are presumably consumed by ``ModelPredictor`` -- confirm there):
            - model_architecture (str): Which Neural Network Architecture will be used.
            - model_architecture_layers (list): Hidden layer information.
            - sample_params (dict): Specification for the training set of the NN model.
            - fitness_to_weight (str): Function to convert fitnesses of uMHs to weight importance.
            - encoder (str): Which encoder will be used to convert the sequence of search operators to input for the
            NN model.
            - memory_length (int): Limit of search operators that would be considered to predict the following
            operator.
            - epochs (int): Number of epochs to train the NN model.
            - load_model (bool): True if it will load a pre-trained model.
            - save_model (bool): True if it will save the trained model.

        :param bool save_steps: Optional.
            Whether to store the information of each replica via ``_save_step``. The default is True.
        :returns list, list: fitness_per_repetition, sequence_per_repetition
        """
        sequence_per_repetition = []
        fitness_per_repetition = []

        # Neural network model that predicts operators
        model = self._get_neural_network_predictor()
        for rep in range(self.parameters["num_replicas"]):
            # Metaheuristic
            mh = Metaheuristic(
                self.problem,
                num_agents=self.parameters["num_agents"],
                num_iterations=self.num_iterations,
            )

            # Initialiser
            mh.apply_initialiser()

            # Extract the best fitness and position found by the initialiser
            current_fitness = np.copy(mh.pop.global_best_fitness)
            current_position = np.copy(mh.pop.rescale_back(mh.pop.global_best_position))

            # Heuristic sets
            self.current_space = np.arange(self.num_operators)

            # Initialise additional variables; the sequence starts with -1 before any operator is accepted
            candidate_enc_so = []
            current_sequence = [-1]

            best_fitness = [current_fitness]
            best_position = [current_position]

            step = 0
            stag_counter = 0
            exclude_indices = []

            # Scale the weights so they add up to one; use a uniform distribution when their sum is not positive
            def normalize_weights(w):
                return w / sum(w) if sum(w) > 0 else np.ones(self.num_operators) / self.num_operators

            # Finalisator
            while not self._check_finalisation(step, stag_counter):
                # Use the trained model to predict operators weights. This happens only when the stagnation counter
                # is zero, i.e., at the first step and right after an operator has been accepted
                if stag_counter == 0:
                    operator_prediction = model.predict(current_sequence)
                    operators_weights = normalize_weights(operator_prediction)

                # Select a simple heuristic and apply it
                candidate_enc_so = self._obtain_candidate_solution(sol=1, operators_weights=operators_weights)
                candidate_search_operator = self.get_operators([candidate_enc_so[-1]])
                perturbators, selectors = op.process_operators(candidate_search_operator)

                mh.apply_search_operator(perturbators[0], selectors[0])

                # Extract population and fitness values
                current_fitness = np.copy(mh.pop.global_best_fitness)
                current_position = np.copy(mh.pop.rescale_back(mh.pop.global_best_position))

                # Print update
                if self.parameters["verbose"]:
                    print(
                        "{} :: Neural Network, Rep: {:3d}, Step: {:3d}, Trial: {:3d}, SO: {:30s}, currPerf: {:.2e}, candPerf: {:.2e}, "
                        "csl: {:3d}".format(
                            self.file_label,
                            rep + 1,
                            step + 1,
                            stag_counter,
                            candidate_search_operator[0][0] + " & " + candidate_search_operator[0][2][:4],
                            best_fitness[-1],
                            current_fitness,
                            len(self.current_space),
                        ),
                        end=" ",
                    )

                # If the candidate solution is strictly better than the current best solution
                if current_fitness < best_fitness[-1]:
                    # Update the current sequence and its characteristics
                    current_sequence.append(candidate_enc_so[-1])

                    best_fitness.append(current_fitness)
                    best_position.append(current_position)

                    # Update counters
                    step += 1
                    stag_counter = 0
                    # Reset tabu list
                    exclude_indices = []

                    # Add improvement mark
                    if self.parameters["verbose"]:
                        print("+", end="")

                else:  # Then try another search operator
                    # Revert the modification to the population in the mh object
                    mh.pop.revert_positions()

                    # Update stagnation
                    stag_counter += 1
                    # Every ``tabu_idx`` failed trials, the last operator tried is banned for the current step
                    if stag_counter % self.parameters["tabu_idx"] == 0:
                        # Include last search operator's index to the tabu list
                        exclude_indices.append(candidate_enc_so[-1])
                        # Set its predicted weight to zero and renormalise the remaining ones
                        operator_prediction[exclude_indices[-1]] = 0
                        operators_weights = normalize_weights(operator_prediction)

                # Add ending mark
                if self.parameters["verbose"]:
                    print("")

            # Print the values obtained with the last operator tried in this replica
            if self.parameters["verbose"]:
                print(f"\nBest fitness: {current_fitness},\nBest position: {current_position}")

            # Update the repetition register
            sequence_per_repetition.append(np.double(current_sequence).astype(int).tolist())
            fitness_per_repetition.append(np.double(best_fitness).tolist())

            # Save this historical register (the file is labelled with the zero-based replica index)
            if save_steps:
                _save_step(
                    rep,
                    {
                        "encoded_solution": np.array(current_sequence),
                        "best_fitness": np.double(best_fitness),
                        "best_positions": np.double(best_position),
                        "details": {
                            "fitness_per_rep": fitness_per_repetition,
                            "sequence_per_rep": sequence_per_repetition,
                            "weight_matrix": self.transition_matrix,
                        },
                    },
                    self.file_label,
                )

        return fitness_per_repetition, sequence_per_repetition

    def _get_neural_network_predictor(self):
        """
        Return the model that predicts the next search operator, either loaded from storage or freshly trained.

        The dictionary ``parameters['model_params']`` is completed in place with 'file_label', 'num_steps', and
        'num_operators' and then used to create a ``ModelPredictor``. If 'load_model' is set and the model loads
        successfully, it is returned as is. Otherwise, training sequences are obtained with
        ``_get_sample_sequences``, converted into a dataset with ``DatasetSequences``, and the model is fitted and,
        if 'save_model' is set, saved.

        :return: The ready-to-use model.
        """
        # Complete the model settings with information known only by this object
        settings = self.parameters["model_params"]
        settings["file_label"] = self.file_label
        settings["num_steps"] = self.parameters["num_steps"]
        settings["num_operators"] = self.num_operators

        predictor = ModelPredictor(settings)

        # Training is skipped only when a stored model was requested and could be loaded
        needs_training = not (settings["load_model"] and predictor.load())
        if needs_training:
            # Build the training set from sample sequences and their fitness values
            train_fitness, train_sequences = self._get_sample_sequences(settings["sample_params"])
            training_set = DatasetSequences(
                train_sequences,
                train_fitness,
                num_operators=self.num_operators,
                fitness_to_weight=settings.get("fitness_to_weight"),
            )
            features, targets, weights = training_set.obtain_dataset()

            predictor.fit(
                features,
                targets,
                settings["epochs"],
                sample_weight=weights,
                verbose=self.parameters["verbose"],
                early_stopping_params=settings.get("early_stopping"),
                verbose_statistics=self.parameters["verbose_statistics"],
            )

            # Keep the trained model for future runs when requested
            if settings["save_model"]:
                predictor.save()

        return predictor


[docs]
    def evaluate_candidate_solution(self, encoded_sequence, initial_scheme=None):
        """
        Run the given sequence as a metaheuristic ``parameters['num_replicas']`` times and measure its performance.

        The sequence can be given either as indices of the heuristic space (they are decoded with
        ``get_operators``) or directly as search operators in tuple form. If the first operator has the role
        'initialize', it is removed from the sequence and used as the initialisation scheme instead of
        ``initial_scheme``. Any element after the third one in each operator tuple is dropped before calling
        ``Metaheuristic``.

        :param list encoded_sequence:
            Sequence of search operators, as indices or as tuples. It cannot be empty.
        :param initial_scheme: Optional.
            Initialisation scheme. If None, ``self.initial_scheme`` is used. A tuple is used as is; any other value
            is processed by ``_select_initial_scheme``. The default is None.
        :return float, dict: Performance and raw data. The dictionary has the keys 'historical', 'fitness',
            'positions', and 'statistics'.
        :raises HyperheuristicError: If the sequence is empty or only contains an initialisation operator.
        """
        # Resolve the initialisation scheme to use
        scheme = initial_scheme
        if scheme is None:
            scheme = self.initial_scheme
        if not isinstance(scheme, tuple):
            scheme = self._select_initial_scheme(scheme)

        if len(encoded_sequence) == 0:
            raise HyperheuristicError("encoded_sequence cannot be empty")

        # Decode the sequence only when it is given as indices
        if isinstance(encoded_sequence[0], (int, np.integer)):
            operators = self.get_operators(np.asarray(encoded_sequence, dtype=int).tolist())
        else:
            operators = encoded_sequence

        # An initialisation operator at the head overrides the scheme and leaves the sequence
        if operators and op._get_role(operators[0]) == "initialize":
            head = operators[0]
            scheme = (head[0], head[1])  # ('scheme_name', {params})
            operators = operators[1:]
            if not operators:
                raise HyperheuristicError(
                    "encoded_sequence must contain at least one perturbation operator after the initialization operator"
                )

        # Metaheuristic expects 3-tuples (name, params, selector), so the optional role suffix is removed
        plain_operators = []
        for entry in operators:
            if len(entry) > 3:
                entry = (entry[0], entry[1], entry[2])
            plain_operators.append(entry)

        # Registers for the information of each replica
        all_historical = []
        all_fitness = []
        all_positions = []

        for _ in range(self.parameters["num_replicas"]):
            mh = Metaheuristic(
                self.problem,
                plain_operators,
                self.parameters["num_agents"],
                self.num_iterations,
                initial_scheme=scheme,
            )
            mh.run()

            all_historical.append(mh.historical)

            # Keep the solution reached in this replica
            position, fitness = mh.get_solution()
            all_fitness.append(fitness)
            all_positions.append(position)

        # Summarise the fitness values and compute the performance from them
        stats = self.get_statistics(all_fitness)
        performance = self.get_performance(stats)
        details = {
            "historical": all_historical,
            "fitness": all_fitness,
            "positions": all_positions,
            "statistics": stats,
        }
        return performance, details



[docs]
    def brute_force(self, save_steps=True):
        """
        Evaluate every search operator of the heuristic space as a 1-cardinality metaheuristic.

        No high-level search method is involved: each operator is evaluated on its own with
        ``evaluate_candidate_solution`` using ``self.initial_scheme``.

        :param bool save_steps: Optional.
            Whether to save the performance and statistics of each operator as a json file. The default is True.
        :return: None.
        """
        for index in range(self.num_operators):
            # A metaheuristic made of this single operator
            single_operator = [self.heuristic_space[index]]

            performance, details = self.evaluate_candidate_solution(
                single_operator, initial_scheme=self.initial_scheme
            )

            if save_steps:
                record = {
                    "encoded_solution": index,
                    "performance": performance,
                    "statistics": details["statistics"],
                }
                _save_step(index, record, self.file_label)

            if self.parameters["verbose"]:
                print(f"{self.file_label} :: Operator {index + 1} of {self.num_operators}, Perf: {performance}")



[docs]
    def basic_metaheuristics(self, save_steps=True):
        """
        Evaluate every predefined metaheuristic stored in the heuristic space, e.g., those from
        './collections/basicmetaheuristics.txt'.

        Each entry of the heuristic space is either a single operator (a tuple, which is wrapped into a list) or an
        already formed sequence of operators, which is used as is. No high-level search method is involved.

        :param bool save_steps: Optional.
            Whether to save the performance and statistics of each entry as a json file. The default is True.
        :return: None.
        """
        for index in range(self.num_operators):
            entry = self.heuristic_space[index]

            # A lone operator becomes a 1-cardinality metaheuristic
            sequence = [entry] if isinstance(entry, tuple) else entry

            performance, details = self.evaluate_candidate_solution(sequence, initial_scheme=self.initial_scheme)

            if save_steps:
                record = {
                    "encoded_solution": index,
                    "performance": performance,
                    "statistics": details["statistics"],
                }
                _save_step(index, record, self.file_label)

            if self.parameters["verbose"]:
                print(f"{self.file_label} :: BasicMH {index + 1} of {self.num_operators}, Perf: {performance}")



[docs]
    @staticmethod
    def get_performance(statistics):
        """
        Return the performance from fitness values obtained from running a metaheuristic several times. This method uses
        the Median and Interquartile Range values for such a purpose:
            performance = Med{fitness values} + IQR{fitness values}
        **Note:** If an alternative formula is needed, check the commented options.
        :param dict statistics: Statistics of the given MH/HH.
        :return: The computed performance.
        """
        # return statistics['Med']                                                                  # Option 1
        # return statistics['Avg'] + statistics['Std']                                              # Option 2
        return statistics["Med"] + statistics["IQR"]  # Option 3

        # return statistics['Avg'] + statistics['Std'] + statistics['Med'] + statistics['IQR']      # Option 4


[docs]
    @staticmethod
    def get_statistics(raw_data):
        """
        Return statistics from all the fitness values found after running a metaheuristic several times. The oncoming
        statistics are ``nob`` (number of observations), ``Min`` (minimum), ``Max`` (maximum), ``Avg`` (average),
        ``Std`` (standard deviation), ``Skw`` (skewness), ``Kur`` (kurtosis), ``IQR`` (interquartile range),
        ``Med`` (median), and ``MAD`` (Median absolute deviation).
        :param list raw_data: List of the fitness values.
        :return: dict: Statistics computed from the raw data.
        """
        # Get descriptive statistics
        dst = st.describe(raw_data)

        # Store statistics
        return {
            "nob": dst.nobs,
            "Min": dst.minmax[0],
            "Max": dst.minmax[1],
            "Avg": dst.mean,
            "Std": np.std(raw_data),
            "Skw": dst.skewness,
            "Kur": dst.kurtosis,
            "IQR": st.iqr(raw_data),
            "Med": np.median(raw_data),
            "MAD": st.median_abs_deviation(raw_data),
        }


    def _get_sample_sequences(self, sample_params):
        """
        Retrieve or generate sequences of search operators, and their fitness values, to be used as training data.

        :param dict sample_params: Store the following values:
            - retrieve_sequences (bool): True to read stored sequences, False to generate them for the given problem
            with the dynamic solver.
            - limit_seqs (int): Optional. The maximum number of sequences to be considered. The default is 100.
            - random (float): Optional. Value used as ``parameters['learning_portion']`` while the dynamic solver
            generates the sequences. The default is 0.37.
            - filter (str): Optional. If given, only the best sequences are kept. Only 'first_quartile' is supported:
            it keeps the sequences whose final fitness is not above the first quartile.
            - store_sequences (bool): True to store the resulting set of sequences.
        :return: A sample of sequences' fitness values and the sequences themselves (seqfitness, seqrep).
        :raises HyperheuristicError: If the filter is not supported or there are no sequences for training.
        """
        # Obtain sequences from previous generations
        if sample_params["retrieve_sequences"]:
            filters = {
                "collection": self.heuristic_space_label,
                "limit_seqs": sample_params.get("limit_seqs", 100),
                "dimensions": f'-{self.problem["dimensions"]}D-',
                "population": f'-{self.parameters["num_agents"]}pop-',
                "func_name": self.problem["func_name"],
            }
            seqfitness, seqrep = _get_stored_sample_sequences(filters)
        else:
            # Generate sequences from dynamic solver, temporarily overriding two parameters
            prev_num_replicas = self.parameters["num_replicas"]
            prev_learning_portion = self.parameters["learning_portion"]
            self.parameters["num_replicas"] = sample_params.get("limit_seqs", 100)
            self.parameters["learning_portion"] = sample_params.get("random", 0.37)
            try:
                seqfitness, seqrep, _ = self._solve_dynamic(save_steps=False)
            finally:
                # Restore the parameters even if the solver fails, so this object is not left misconfigured
                self.parameters["num_replicas"] = prev_num_replicas
                self.parameters["learning_portion"] = prev_learning_portion

        # Filter sequences with best performance
        if "filter" in sample_params:
            if sample_params["filter"] != "first_quartile":
                raise HyperheuristicError(f'"{sample_params["filter"]}" is not supported yet!')

            if len(seqfitness) > 0:
                seqfitness_last = [sequence[-1] for sequence in seqfitness]
                top_value = np.quantile(seqfitness_last, 0.25)

                # Sequences usually have different lengths, so they are filtered as plain lists: building a numpy
                # array from ragged lists fails in recent numpy versions
                keep_flags = [last_value <= top_value for last_value in seqfitness_last]
                seqfitness = [sequence for sequence, keep in zip(seqfitness, keep_flags) if keep]
                seqrep = [sequence for sequence, keep in zip(seqrep, keep_flags) if keep]

        # Verify that there is sequences for training
        if len(seqfitness) == 0 or len(seqrep) == 0:
            raise HyperheuristicError("There is no sample of sequences for training")

        # Store sequences if requested
        if sample_params["store_sequences"]:
            # Order sequences according to its final fitness
            indices_order = sorted(range(len(seqfitness)), key=lambda idx: seqfitness[idx][-1])
            sequences_to_save = {idx: (seqfitness[idx], seqrep[idx]) for idx in indices_order}

            # Store sequence without identificator of experiment : '-'.join(self.file_label.split('-')[:2]
            sequences_name = "-".join(
                [
                    self.problem["func_name"],
                    f'{self.problem["dimensions"]}D',
                    f'{self.parameters["num_agents"]}pop',
                    self.heuristic_space_label,
                    self.file_label,
                ]
            )
            _save_sequences(sequences_name, sequences_to_save)

        return seqfitness, seqrep

    def _update_weights(self, sequences=None):
        """
        Update the information used to choose search operators from the sequences found so far.

        If there are no weights yet, or fewer sequences than ``num_replicas * learning_portion`` (truncated to an
        integer) are given, ``self.weights`` is set to a uniform distribution over the operators. Otherwise,
        ``self.transition_matrix`` is rebuilt: its row ``k`` contains the relative frequency of each operator at the
        position ``k`` of the sequences. Negative entries, such as the -1 that marks the initialiser, are not
        counted, and a row without any counted operator becomes uniform.

        :param list sequences: Optional.
            Sequences of operator indices. If it is None or empty and the weights already exist, nothing changes.
            The default is None.
        :return: None.
        """
        if (self.weights is None) or (
            sequences is not None
            and len(sequences) < int(self.parameters["num_replicas"] * self.parameters["learning_portion"])
        ):
            # Create the weights array using a uniform distribution
            self.weights = np.ones(self.num_operators) / self.num_operators
            return

        # Nothing to learn from; this guard avoids iterating over None or taking the maximum of an empty list
        if sequences is None or len(sequences) == 0:
            return

        max_length = max(len(seq) for seq in sequences)

        # One bin per operator index: [-0.5, 0.5), ..., [num_operators - 1.5, num_operators - 0.5]
        operator_bins = np.arange(self.num_operators + 1) - 0.5

        current_hist = []
        for ii_step in range(max_length):
            # Operators used at this position; shorter sequences simply do not contribute
            operators_at_step = [seq[ii_step] for seq in sequences if ii_step < len(seq)]

            # Values out of the bins (e.g., -1 for the initialiser) are ignored by the histogram
            counts, _ = np.histogram(operators_at_step, bins=operator_bins)
            total = np.sum(counts)
            if total > 0.0:
                current_hist.append((counts / total).tolist())
            else:
                current_hist.append((np.ones(self.num_operators) / self.num_operators).tolist())

        self.transition_matrix = np.array(current_hist)



# %% ADDITIONAL TOOLS


def _save_step(step_number, variable_to_save, prefix=""):
    """
    Save all the information corresponding to a specific step into a JSON file.

    The file is written inside ``data_files/raw/<prefix>`` or, when no prefix is given, inside
    ``data_files/raw/Exp-<mm_dd_YYYY>``. Its name is ``<step_number>-<mm_dd_YYYY_HH_MM_SS>.json``, using the current
    local date and time.

    :param int step_number:
        Value of the current step in the hyper-heuristic procedure. If it is not a hyper-heuristic, this integer
        corresponds to operator index.
    :param dict variable_to_save:
        Variables to save in dictionary format.
    :param str prefix: Optional.
        Additional information to be used in naming the folder. The default is ''.
    :return: None.
    """
    # Get the current date
    now = datetime.now()

    # Define the folder name
    experiment_label = prefix if prefix != "" else "Exp-" + now.strftime("%m_%d_%Y")
    folder_name = "data_files/raw/" + experiment_label

    # Create the folder if needed. `exist_ok` avoids the check-then-create race that raises FileExistsError when
    # several processes save their steps at the same time
    _create_path(folder_name, exist_ok=True)

    # Create a new file for this step
    file_path = folder_name + f"/{step_number}-" + now.strftime("%m_%d_%Y_%H_%M_%S") + ".json"
    with open(file_path, "w", encoding="utf-8") as json_file:
        json.dump(variable_to_save, json_file, cls=jt.NumpyEncoder)


def _get_stored_sample_sequences(filters, folder_name="./data_files/sequences/"):
    """
    Search and read stored sequences that satisfy certain properties.

    A file is considered only if its name contains the values of ``filters['func_name']``,
    ``filters['dimensions']``, ``filters['population']`` and ``filters['collection']``. Files are grouped by problem
    name (the text before the first '-' in the file name) and reading stops for a problem once
    ``filters['limit_seqs']`` sequences have been collected for it.

    :param dict filters:
        Dictionary with the constraints. It must contain the keys 'func_name', 'dimensions', 'population',
        'collection' (strings looked up in the file names) and 'limit_seqs' (maximum number of sequences to retrieve
        per problem).
    :param str folder_name: Optional.
        Folder that stores the sequences files, with or without a trailing path separator. The default is
        './data_files/sequences/'.
    :return list, list:
        Return the list of fitness values and the list of their respective sequences. Both are empty when the folder
        does not exist.
    """
    if not _check_path(folder_name):
        return [], []

    # Filter stored sequences: the file name must mention every essential attribute of the problem
    essential_attributes = ("func_name", "dimensions", "population", "collection")
    sequences_files = [
        file_name
        for file_name in jt.read_folder_files(folder_name)
        if all(filters[attribute] in file_name for attribute in essential_attributes)
    ]

    # Limit the number of sequences retrieved from a problem
    limit_seqs = filters["limit_seqs"]
    sequences_per_problem = {}

    # Extract sequences from stored sequences files
    seqfitness, seqrep = [], []
    for sequences_file in sequences_files:
        # The problem name is the first '-'-separated field of the file name without its extension
        problem_name = os.path.splitext(sequences_file)[0].split("-")[0]

        # Initialise the counter per problem and check the limit before reading the json file
        if sequences_per_problem.setdefault(problem_name, 0) == limit_seqs:
            continue

        # Join the path properly so that a folder name without trailing separator also works
        sequences_json = jt.read_json(os.path.join(folder_name, sequences_file))
        for fitness, sequence in sequences_json.values():
            # Check limit before append sequence
            if sequences_per_problem[problem_name] == limit_seqs:
                break

            # Append sequence
            seqfitness.append(fitness)
            seqrep.append(sequence)
            sequences_per_problem[problem_name] += 1

    return seqfitness, seqrep


def _save_sequences(file_name, sequences_to_save):
    """
    Save encoded sequences and their fitness values to use them later to train ML models.

    The sequences are written to ``data_files/sequences/<file_name>.json``, overwriting the file if it already
    exists.

    :param str file_name: Name (without extension) of the file where the sequences will be stored.
    :param dict sequences_to_save: Sequences that will be stored.
    :return: None.
    """
    # Define the folder name
    folder_name = "data_files/sequences/"

    # Create the folder if needed. `exist_ok` avoids the check-then-create race that raises FileExistsError when
    # several processes store their sequences at the same time
    _create_path(folder_name, exist_ok=True)

    # Overwrite or create file to store the sequences along with their respective fitness
    with open(folder_name + f"{file_name}.json", "w", encoding="utf-8") as json_file:
        json.dump(sequences_to_save, json_file, cls=jt.NumpyEncoder)



[docs]
class HyperheuristicError(Exception):
    """
    Exception raised to report errors related to the hyper-heuristic process.

    It adds nothing to the built-in ``Exception``; it only provides a dedicated type that can be caught separately.
    """