CorrelatedVectorFactory.java

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.commons.math4.legacy.random;

import java.util.function.Supplier;

import org.apache.commons.rng.UniformRandomProvider;
import org.apache.commons.rng.sampling.distribution.ContinuousSampler;
import org.apache.commons.rng.sampling.distribution.ContinuousUniformSampler;
import org.apache.commons.rng.sampling.distribution.ZigguratNormalizedGaussianSampler;
import org.apache.commons.math4.legacy.exception.DimensionMismatchException;
import org.apache.commons.math4.core.jdkmath.JdkMath;
import org.apache.commons.math4.legacy.linear.RealMatrix;
import org.apache.commons.math4.legacy.linear.RectangularCholeskyDecomposition;

/**
 * Generates vectors with with correlated components.
 *
 * <p>Random vectors with correlated components are built by combining
 * the uncorrelated components of another random vector in such a way
 * that the resulting correlations are the ones specified by a positive
 * definite covariance matrix.</p>
 *
 * <p>The main use of correlated random vector generation is for Monte-Carlo
 * simulation of physical problems with several variables (for example to
 * generate error vectors to be added to a nominal vector). A particularly
 * common case is when the generated vector should be drawn from a
 * <a href="http://en.wikipedia.org/wiki/Multivariate_normal_distribution">
 * Multivariate Normal Distribution</a>, usually using Cholesky decomposition.
 * Other distributions are possible as long as the underlying sampler provides
 * normalized values (unit standard deviation).</p>
 *
 * <p>Sometimes, the covariance matrix for a given simulation is not
 * strictly positive definite. This means that the correlations are
 * not all independent from each other. In this case, however, the non
 * strictly positive elements found during the Cholesky decomposition
 * of the covariance matrix should not be negative either, they
 * should be null. Another non-conventional extension handling this case
 * is used here. Rather than computing <code>C = U<sup>T</sup> U</code>
 * where <code>C</code> is the covariance matrix and <code>U</code>
 * is an upper-triangular matrix, we compute <code>C = B B<sup>T</sup></code>
 * where <code>B</code> is a rectangular matrix having more rows than
 * columns. The number of columns of <code>B</code> is the rank of the
 * covariance matrix, and it is the dimension of the uncorrelated
 * random vector that is needed to compute the component of the
 * correlated vector. This class handles this situation automatically.</p>
 */
public class CorrelatedVectorFactory {
    /** Square root of three. */
    private static final double SQRT3 = JdkMath.sqrt(3);
    /** Mean vector. */
    private final double[] mean;
    /** Root of the covariance matrix. */
    private final RealMatrix root;
    /** Size of uncorrelated vector. */
    private final int lengthUncorrelated;
    /** Size of correlated vector. */
    private final int lengthCorrelated;

    /**
     * Correlated vector factory.
     *
     * @param mean Expected mean values of the components.
     * @param covariance Covariance matrix.
     * @param small Diagonal elements threshold under which columns are
     * considered to be dependent on previous ones and are discarded.
     * @throws org.apache.commons.math4.legacy.linear.NonPositiveDefiniteMatrixException
     * if the covariance matrix is not strictly positive definite.
     * @throws DimensionMismatchException if the mean and covariance
     * arrays dimensions do not match.
     */
    public CorrelatedVectorFactory(double[] mean,
                                   RealMatrix covariance,
                                   double small) {
        lengthCorrelated = covariance.getRowDimension();
        if (mean.length != lengthCorrelated) {
            throw new DimensionMismatchException(mean.length, lengthCorrelated);
        }
        this.mean = mean.clone();

        final RectangularCholeskyDecomposition decomposition
            = new RectangularCholeskyDecomposition(covariance, small);
        root = decomposition.getRootMatrix();

        lengthUncorrelated = decomposition.getRank();
    }

    /**
     * Null mean correlated vector factory.
     *
     * @param covariance Covariance matrix.
     * @param small Diagonal elements threshold under which columns are
     * considered to be dependent on previous ones and are discarded.
     * @throws org.apache.commons.math4.legacy.linear.NonPositiveDefiniteMatrixException
     * if the covariance matrix is not strictly positive definite.
     */
    public CorrelatedVectorFactory(RealMatrix covariance,
                                   double small) {
        this(new double[covariance.getRowDimension()],
             covariance,
             small);
    }

    /**
     * @param rng RNG.
     * @return a generator of vectors with correlated components sampled
     * from a uniform distribution.
     */
    public Supplier<double[]> uniform(UniformRandomProvider rng) {
        return with(new ContinuousUniformSampler(rng, -SQRT3, SQRT3));
    }

    /**
     * @param rng RNG.
     * @return a generator of vectors with correlated components sampled
     * from a normal distribution.
     */
    public Supplier<double[]> gaussian(UniformRandomProvider rng) {
        return with(new ZigguratNormalizedGaussianSampler(rng));
    }

    /**
     * @param sampler Generator of samples from a normalized distribution.
     * @return a generator of vectors with correlated components.
     */
    private Supplier<double[]> with(final ContinuousSampler sampler) {
        return new Supplier<double[]>() {
            @Override
            public double[] get() {
                // Uncorrelated vector.
                final double[] uncorrelated = new double[lengthUncorrelated];
                for (int i = 0; i < lengthUncorrelated; i++) {
                    uncorrelated[i] = sampler.sample();
                }

                // Correlated vector.
                final double[] correlated = mean.clone();
                for (int i = 0; i < correlated.length; i++) {
                    for (int j = 0; j < lengthUncorrelated; j++) {
                        correlated[i] += root.getEntry(i, j) * uncorrelated[j];
                    }
                }

                return correlated;
            }
        };
    }
}