MultivariateFunctionPenaltyAdapter.java
- /*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * https://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
- /*
- * This is not the original file distributed by the Apache Software Foundation
- * It has been modified by the Hipparchus project
- */
- package org.hipparchus.optim.nonlinear.scalar;
- import org.hipparchus.analysis.MultivariateFunction;
- import org.hipparchus.exception.LocalizedCoreFormats;
- import org.hipparchus.exception.MathIllegalArgumentException;
- import org.hipparchus.util.FastMath;
- import org.hipparchus.util.MathUtils;
- /**
- * <p>Adapter extending bounded {@link MultivariateFunction} to an unbouded
- * domain using a penalty function.</p>
- *
- * <p>
- * This adapter can be used to wrap functions subject to simple bounds on
- * parameters so they can be used by optimizers that do <em>not</em> directly
- * support simple bounds.
- * </p>
- * <p>
- * The principle is that the user function that will be wrapped will see its
- * parameters bounded as required, i.e when its {@code value} method is called
- * with argument array {@code point}, the elements array will fulfill requirement
- * {@code lower[i] <= point[i] <= upper[i]} for all i. Some of the components
- * may be unbounded or bounded only on one side if the corresponding bound is
- * set to an infinite value. The optimizer will not manage the user function by
- * itself, but it will handle this adapter and it is this adapter that will take
- * care the bounds are fulfilled. The adapter {@link #value(double[])} method will
- * be called by the optimizer with unbound parameters, and the adapter will check
- * if the parameters is within range or not. If it is in range, then the underlying
- * user function will be called, and if it is not the value of a penalty function
- * will be returned instead.
- * </p>
- * <p>
- * This adapter is only a poor-man's solution to simple bounds optimization
- * constraints that can be used with simple optimizers like
- * {@link org.hipparchus.optim.nonlinear.scalar.noderiv.SimplexOptimizer
- * SimplexOptimizer}.
- * A better solution is to use an optimizer that directly supports simple bounds like
- * {@link org.hipparchus.optim.nonlinear.scalar.noderiv.CMAESOptimizer
- * CMAESOptimizer} or
- * {@link org.hipparchus.optim.nonlinear.scalar.noderiv.BOBYQAOptimizer
- * BOBYQAOptimizer}.
- * One caveat of this poor-man's solution is that if start point or start simplex
- * is completely outside of the allowed range, only the penalty function is used,
- * and the optimizer may converge without ever entering the range.
- * </p>
- *
- * @see MultivariateFunctionMappingAdapter
- *
- */
- public class MultivariateFunctionPenaltyAdapter
- implements MultivariateFunction {
- /** Underlying bounded function. */
- private final MultivariateFunction bounded;
- /** Lower bounds. */
- private final double[] lower;
- /** Upper bounds. */
- private final double[] upper;
- /** Penalty offset. */
- private final double offset;
- /** Penalty scales. */
- private final double[] scale;
- /**
- * Simple constructor.
- * <p>
- * When the optimizer provided points are out of range, the value of the
- * penalty function will be used instead of the value of the underlying
- * function. In order for this penalty to be effective in rejecting this
- * point during the optimization process, the penalty function value should
- * be defined with care. This value is computed as:</p>
- * <p>
- * penalty(point) = offset + ∑<sub>i</sub>[scale[i] * √|point[i]-boundary[i]|]
- * </p>
- * <p>
- * where indices i correspond to all the components that violates their boundaries.
- * </p>
- * <p>
- * So when attempting a function minimization, offset should be larger than
- * the maximum expected value of the underlying function and scale components
- * should all be positive. When attempting a function maximization, offset
- * should be lesser than the minimum expected value of the underlying function
- * and scale components should all be negative.
- * minimization, and lesser than the minimum expected value of the underlying
- * function when attempting maximization.
- * </p>
- * <p>
- * These choices for the penalty function have two properties. First, all out
- * of range points will return a function value that is worse than the value
- * returned by any in range point. Second, the penalty is worse for large
- * boundaries violation than for small violations, so the optimizer has an hint
- * about the direction in which it should search for acceptable points.
- * </p>
- * @param bounded bounded function
- * @param lower lower bounds for each element of the input parameters array
- * (some elements may be set to {@code Double.NEGATIVE_INFINITY} for
- * unbounded values)
- * @param upper upper bounds for each element of the input parameters array
- * (some elements may be set to {@code Double.POSITIVE_INFINITY} for
- * unbounded values)
- * @param offset base offset of the penalty function
- * @param scale scale of the penalty function
- * @exception MathIllegalArgumentException if lower bounds, upper bounds and
- * scales are not consistent, either according to dimension or to bounadary
- * values
- */
- public MultivariateFunctionPenaltyAdapter(final MultivariateFunction bounded,
- final double[] lower, final double[] upper,
- final double offset, final double[] scale) {
- // safety checks
- MathUtils.checkNotNull(lower);
- MathUtils.checkNotNull(upper);
- MathUtils.checkNotNull(scale);
- if (lower.length != upper.length) {
- throw new MathIllegalArgumentException(LocalizedCoreFormats.DIMENSIONS_MISMATCH,
- lower.length, upper.length);
- }
- if (lower.length != scale.length) {
- throw new MathIllegalArgumentException(LocalizedCoreFormats.DIMENSIONS_MISMATCH,
- lower.length, scale.length);
- }
- for (int i = 0; i < lower.length; ++i) {
- if (!(upper[i] >= lower[i])) { // NOPMD - the test is written in such a way it also fails for NaN
- throw new MathIllegalArgumentException(LocalizedCoreFormats.NUMBER_TOO_SMALL,
- upper[i], lower[i]);
- }
- }
- this.bounded = bounded;
- this.lower = lower.clone();
- this.upper = upper.clone();
- this.offset = offset;
- this.scale = scale.clone();
- }
- /**
- * Computes the underlying function value from an unbounded point.
- * <p>
- * This method simply returns the value of the underlying function
- * if the unbounded point already fulfills the bounds, and compute
- * a replacement value using the offset and scale if bounds are
- * violated, without calling the function at all.
- * </p>
- * @param point unbounded point
- * @return either underlying function value or penalty function value
- */
- @Override
- public double value(double[] point) {
- for (int i = 0; i < scale.length; ++i) {
- if ((point[i] < lower[i]) || (point[i] > upper[i])) {
- // bound violation starting at this component
- double sum = 0;
- for (int j = i; j < scale.length; ++j) {
- final double overshoot;
- if (point[j] < lower[j]) {
- overshoot = scale[j] * (lower[j] - point[j]);
- } else if (point[j] > upper[j]) {
- overshoot = scale[j] * (point[j] - upper[j]);
- } else {
- overshoot = 0;
- }
- sum += FastMath.sqrt(overshoot);
- }
- return offset + sum;
- }
- }
- // all boundaries are fulfilled, we are in the expected
- // domain of the underlying function
- return bounded.value(point);
- }
- }