#!/usr/bin/env python
# coding: utf-8
import numpy as np
from typing import Union, List
from ..custom.probabilistic_models import UniGauss
from ..custom.initialization_models import UniformGenInit, UniGaussGenInit
from ..eda import EDA
[docs]class UMDAc(EDA):
"""
Univariate marginal Estimation of Distribution algorithm continuous. New individuals are sampled
from a univariate normal probabilistic model. It can be used for hyper-parameter optimization
or to optimize a function.
UMDA [1] is a specific type of Estimation of Distribution Algorithm (EDA) where new individuals
are sampled from univariate normal distributions and are updated in each iteration of the
algorithm by the best individuals found in the previous iteration. In this implementation each
individual is an array of real data so new individuals are sampled from a univariate probabilistic
model updated in each iteration. Optionally it is possible to set lower bound to the standard
deviation of the normal distribution for the variables to avoid premature convergence.
This algorithms has been widely used for different applications such as in [2] where it is
applied to optimize the parameters of a quantum paremetric circuit and is shown how it outperforms
other approaches in specific situations.
Example:
This short example runs UMDAc for a benchmark function optimization problem in the continuous space.
.. code-block:: python
from EDAspy.benchmarks import ContinuousBenchmarkingCEC14
from EDAspy.optimization import UMDAc
n_vars = 10
benchmarking = ContinuousBenchmarkingCEC14(n_vars)
umda = UMDAc(size_gen=100, max_iter=100, dead_iter=10, n_variables=10, alpha=0.5,
lower_bound=-100, upper_bound=100)
eda_result = umda.minimize(benchmarking.cec4, True)
References:
[1]: LarraƱaga, P., & Lozano, J. A. (Eds.). (2001). Estimation of distribution algorithms:
A new tool for evolutionary computation (Vol. 2). Springer Science & Business Media.
[2]: Vicente P. Soloviev, Pedro LarraƱaga and Concha Bielza (2022, July). Quantum Parametric
Circuit Optimization with Estimation of Distribution Algorithms. In 2022 The Genetic and
Evolutionary Computation Conference (GECCO). DOI: https://doi.org/10.1145/3520304.3533963
"""
def __init__(self,
size_gen: int,
max_iter: int,
dead_iter: int,
n_variables: int,
lower_bound: Union[np.array, List[float], float] = None,
upper_bound: Union[np.array, List[float], float] = None,
alpha: float = 0.5,
vector: np.array = None,
lower_factor: float = 0.5,
elite_factor: float = 0.4,
disp: bool = True,
parallelize: bool = False,
init_data: np.array = None,
w_noise: float = .5):
r"""
:param size_gen: Population size of each generation.
:param max_iter: Maximum number of function evaluations.
:param dead_iter: Stopping criteria. Number of iterations after with no improvement after which EDA stops.
:param n_variables: Number of variables to be optimized.
:param lower_bound: lower bound for the uniform distribution sampling.
:param upper_bound: lower bound for the uniform distribution sampling.
:param alpha: Percentage of population selected to update the probabilistic model.
:param vector: Array with shape (2, n_variables) where rows are mean and std of the parameters to be optimized.
:param lower_factor: Lower bound imposed in std of the variables to not converge to std=0.
:param elite_factor: Percentage of previous population selected to add to new generation (elite approach).
:param disp: Set to True to print convergence messages.
:param parallelize: True if the evaluation of the solutions is desired to be parallelized in multiple cores.
:param init_data: Numpy array containing the data the EDA is desired to be initialized from. By default, an
initializer is used.
:param w_noise: Intensity of the Gaussian white noise added to each generation in order to avoid genetic drift.
:type w_noise: float
:type lower_bound: List of lower bounds of size equal to number of variables OR single bound to all dimensions.
:type upper_bound: List of upper bounds of size equal to number of variables OR single bound to all dimensions.
"""
self.vector = vector
self.lower_bound = lower_factor
self.names_vars = list(range(n_variables))
super().__init__(size_gen=size_gen, max_iter=max_iter, dead_iter=dead_iter, n_variables=n_variables,
alpha=alpha, elite_factor=elite_factor, disp=disp, parallelize=parallelize,
init_data=init_data, w_noise=w_noise)
if self.vector is not None:
assert self.vector.shape == (2, n_variables)
self.init = UniGaussGenInit(n_variables, means_vector=self.vector[0, :], stds_vector=self.vector[1, :])
else:
self.init = UniformGenInit(self.n_variables, lower_bound=lower_bound, upper_bound=upper_bound)
self.pm = UniGauss(self.names_vars, lower_factor)