1 /*
2 * Licensed to the Apache Software Foundation (ASF) under one or more
3 * contributor license agreements. See the NOTICE file distributed with
4 * this work for additional information regarding copyright ownership.
5 * The ASF licenses this file to You under the Apache License, Version 2.0
6 * (the "License"); you may not use this file except in compliance with
7 * the License. You may obtain a copy of the License at
8 *
9 * https://www.apache.org/licenses/LICENSE-2.0
10 *
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
16 */
17
18 /*
19 * This is not the original file distributed by the Apache Software Foundation
20 * It has been modified by the Hipparchus project
21 */
22
23 package org.hipparchus.optim.nonlinear.scalar;
24
25 import org.hipparchus.analysis.MultivariateFunction;
26 import org.hipparchus.analysis.MultivariateVectorFunction;
27 import org.hipparchus.exception.LocalizedCoreFormats;
28 import org.hipparchus.exception.MathIllegalArgumentException;
29 import org.hipparchus.linear.RealMatrix;
30
31 /**
32 * This class converts
33 * {@link MultivariateVectorFunction vectorial objective functions} to
34 * {@link MultivariateFunction scalar objective functions}
35 * when the goal is to minimize them.
36 * <br>
37 * This class is mostly used when the vectorial objective function represents
38 * a theoretical result computed from a point set applied to a model and
39 * the models point must be adjusted to fit the theoretical result to some
40 * reference observations. The observations may be obtained for example from
41 * physical measurements whether the model is built from theoretical
42 * considerations.
43 * <br>
44 * This class computes a possibly weighted squared sum of the residuals, which is
45 * a scalar value. The residuals are the difference between the theoretical model
46 * (i.e. the output of the vectorial objective function) and the observations. The
47 * class implements the {@link MultivariateFunction} interface and can therefore be
48 * minimized by any optimizer supporting scalar objectives functions.This is one way
49 * to perform a least square estimation. There are other ways to do this without using
50 * this converter, as some optimization algorithms directly support vectorial objective
51 * functions.
52 * <br>
53 * This class support combination of residuals with or without weights and correlations.
54 *
55 * @see MultivariateFunction
56 * @see MultivariateVectorFunction
57 */
58
59 public class LeastSquaresConverter implements MultivariateFunction {
60 /** Underlying vectorial function. */
61 private final MultivariateVectorFunction function;
62 /** Observations to be compared to objective function to compute residuals. */
63 private final double[] observations;
64 /** Optional weights for the residuals. */
65 private final double[] weights;
66 /** Optional scaling matrix (weight and correlations) for the residuals. */
67 private final RealMatrix scale;
68
69 /**
70 * Builds a simple converter for uncorrelated residuals with identical
71 * weights.
72 *
73 * @param function vectorial residuals function to wrap
74 * @param observations observations to be compared to objective function to compute residuals
75 */
76 public LeastSquaresConverter(final MultivariateVectorFunction function,
77 final double[] observations) {
78 this.function = function;
79 this.observations = observations.clone();
80 this.weights = null;
81 this.scale = null;
82 }
83
84 /**
85 * Builds a simple converter for uncorrelated residuals with the
86 * specified weights.
87 * <p>
88 * The scalar objective function value is computed as:
89 * objective = ∑weight<sub>i</sub>(observation<sub>i</sub>-objective<sub>i</sub>)<sup>2</sup>
90 * </p>
91 * <p>
92 * Weights can be used for example to combine residuals with different standard
93 * deviations. As an example, consider a residuals array in which even elements
94 * are angular measurements in degrees with a 0.01° standard deviation and
95 * odd elements are distance measurements in meters with a 15m standard deviation.
96 * In this case, the weights array should be initialized with value
97 * 1.0/(0.01<sup>2</sup>) in the even elements and 1.0/(15.0<sup>2</sup>) in the
98 * odd elements (i.e. reciprocals of variances).
99 * </p>
100 * <p>
101 * The array computed by the objective function, the observations array and the
102 * weights array must have consistent sizes or a {@link MathIllegalArgumentException}
103 * will be triggered while computing the scalar objective.
104 * </p>
105 *
106 * @param function vectorial residuals function to wrap
107 * @param observations observations to be compared to objective function to compute residuals
108 * @param weights weights to apply to the residuals
109 * @throws MathIllegalArgumentException if the observations vector and the weights
110 * vector dimensions do not match (objective function dimension is checked only when
111 * the {@link #value(double[])} method is called)
112 */
113 public LeastSquaresConverter(final MultivariateVectorFunction function,
114 final double[] observations,
115 final double[] weights) {
116 if (observations.length != weights.length) {
117 throw new MathIllegalArgumentException(LocalizedCoreFormats.DIMENSIONS_MISMATCH,
118 observations.length, weights.length);
119 }
120 this.function = function;
121 this.observations = observations.clone();
122 this.weights = weights.clone();
123 this.scale = null;
124 }
125
126 /**
127 * Builds a simple converter for correlated residuals with the
128 * specified weights.
129 * <p>
130 * The scalar objective function value is computed as:
131 * objective = y<sup>T</sup>y with y = scale×(observation-objective)
132 * </p>
133 * <p>
134 * The array computed by the objective function, the observations array and the
135 * the scaling matrix must have consistent sizes or a {@link MathIllegalArgumentException}
136 * will be triggered while computing the scalar objective.
137 * </p>
138 *
139 * @param function vectorial residuals function to wrap
140 * @param observations observations to be compared to objective function to compute residuals
141 * @param scale scaling matrix
142 * @throws MathIllegalArgumentException if the observations vector and the scale
143 * matrix dimensions do not match (objective function dimension is checked only when
144 * the {@link #value(double[])} method is called)
145 */
146 public LeastSquaresConverter(final MultivariateVectorFunction function,
147 final double[] observations,
148 final RealMatrix scale) {
149 if (observations.length != scale.getColumnDimension()) {
150 throw new MathIllegalArgumentException(LocalizedCoreFormats.DIMENSIONS_MISMATCH,
151 observations.length, scale.getColumnDimension());
152 }
153 this.function = function;
154 this.observations = observations.clone();
155 this.weights = null;
156 this.scale = scale.copy();
157 }
158
159 /** {@inheritDoc} */
160 @Override
161 public double value(final double[] point) {
162 // compute residuals
163 final double[] residuals = function.value(point);
164 if (residuals.length != observations.length) {
165 throw new MathIllegalArgumentException(LocalizedCoreFormats.DIMENSIONS_MISMATCH,
166 residuals.length, observations.length);
167 }
168 for (int i = 0; i < residuals.length; ++i) {
169 residuals[i] -= observations[i];
170 }
171
172 // compute sum of squares
173 double sumSquares = 0;
174 if (weights != null) {
175 for (int i = 0; i < residuals.length; ++i) {
176 final double ri = residuals[i];
177 sumSquares += weights[i] * ri * ri;
178 }
179 } else if (scale != null) {
180 for (final double yi : scale.operate(residuals)) {
181 sumSquares += yi * yi;
182 }
183 } else {
184 for (final double ri : residuals) {
185 sumSquares += ri * ri;
186 }
187 }
188
189 return sumSquares;
190 }
191 }