// correlations.cpp
// OpenNN: Open Neural Networks Library
// www.opennn.net
//
// C O R R E L A T I O N S
//
// Artificial Intelligence Techniques SL
// artelnics@artelnics.com
9#include "correlations.h"
10#include "data_set.h"
11#include "neural_network.h"
12#include "training_strategy.h"
13
14namespace OpenNN
15{
16
20
21Correlation linear_correlation(const ThreadPoolDevice* thread_pool_device,
22 const Tensor<type, 1>& x,
23 const Tensor<type, 1>& y)
24{
25#ifdef OPENNN_DEBUG
26
27 const Index x_size = x.size();
28
29 ostringstream buffer;
30
31 if(x_size != y.size())
32 {
33 buffer << "OpenNN Exception: Vector Template.\n"
34 << "Correlation linear_correlation(const Tensor<type, 1>&) const method.\n"
35 << "Y size must be equal to X size.\n";
36
37 throw logic_error(buffer.str());
38 }
39
40#endif
41
42 Correlation linear_correlation;
43
44 linear_correlation.correlation_type = CorrelationMethod::Linear;
45
46 if(is_constant(y))
47 {
48 linear_correlation.a = y(0);
49 linear_correlation.b = type(0);
50 linear_correlation.r = type(1);
51
52 return linear_correlation;
53 }
54
55 pair<Tensor<type, 1>, Tensor<type, 1>> filter_vectors = filter_missing_values_vector_vector(x,y);
56
57 const Tensor<double, 1> x_filter = filter_vectors.first.cast<double>();
58 const Tensor<double, 1> y_filter = filter_vectors.second.cast<double>();
59
60 Tensor<double, 0> s_x;
61 Tensor<double, 0> s_y;
62
63 Tensor<double, 0> s_xx;
64 Tensor<double, 0> s_yy;
65
66 Tensor<double, 0> s_xy;
67
68 s_x.device(*thread_pool_device) = x_filter.sum();
69 s_y.device(*thread_pool_device) = y_filter.sum();
70 s_xx.device(*thread_pool_device) = x_filter.square().sum();
71 s_yy.device(*thread_pool_device) = y_filter.square().sum();
72 s_xy.device(*thread_pool_device) = (y_filter*x_filter).sum();
73
74 if(abs(s_x()) < NUMERIC_LIMITS_MIN
75 && abs(s_y()) < NUMERIC_LIMITS_MIN
76 && abs(s_xx()) < NUMERIC_LIMITS_MIN
77 && abs(s_yy()) < NUMERIC_LIMITS_MIN
78 && abs(s_xy()) < NUMERIC_LIMITS_MIN)
79 {
80 linear_correlation.a = type(0);
81
82 linear_correlation.b = type(0);
83
84 linear_correlation.r = type(1);
85 }
86 else
87 {
88 const Index n = x_filter.size();
89
90 linear_correlation.a =
91 type((s_y() * s_xx() - s_x() * s_xy())/(static_cast<double>(n) * s_xx() - s_x() * s_x()));
92
93 linear_correlation.b =
94 type(((static_cast<double>(n) * s_xy()) - (s_x() * s_y())) /((static_cast<double>(n) * s_xx()) - (s_x() * s_x())));
95
96 if(sqrt((static_cast<double>(n) * s_xx() - s_x() * s_x()) *(static_cast<double>(n) * s_yy() - s_y() * s_y())) < NUMERIC_LIMITS_MIN)
97 {
98 linear_correlation.r = type(1);
99 }
100 else
101 {
102 linear_correlation.r =
103 type((static_cast<double>(n) * s_xy() - s_x() * s_y()) /
104 sqrt((static_cast<double>(n) * s_xx() - s_x() * s_x()) *(static_cast<double>(n) * s_yy() - s_y() * s_y())));
105 }
106 }
107
108 return linear_correlation;
109}
110
111
116
117Correlation logarithmic_correlation(const ThreadPoolDevice* thread_pool_device, const Tensor<type, 1>& x, const Tensor<type, 1>& y)
118{
119#ifdef OPENNN_DEBUG
120
121 Index n = y.size();
122
123 const Index x_size = x.size();
124
125 ostringstream buffer;
126
127 if(x_size != n)
128 {
129 buffer << "OpenNN Exception: Vector Template.\n"
130 << "Correlation "
131 "logarithmic_correlation(const Tensor<type, 1>&) const "
132 "method.\n"
133 << "Y size must be equal to X size.\n";
134
135 throw logic_error(buffer.str());
136 }
137
138#endif
139
140 // Check negative values from x
141
142 Correlation logarithmic_correlation;
143
144 for(Index i = 0; i < x.dimension(0); i++)
145 {
146 if(!isnan(x(i)) && x(i) <= type(0))
147 {
148 logarithmic_correlation.r = type(NAN);
149
150 return logarithmic_correlation;
151 }
152 }
153
154 logarithmic_correlation = linear_correlation(thread_pool_device, x.log(), y);
155
156 logarithmic_correlation.correlation_type = CorrelationMethod::Logarithmic;
157
158 return logarithmic_correlation;
159}
160
161
165
166Correlation exponential_correlation(const ThreadPoolDevice* thread_pool_device, const Tensor<type, 1>& x, const Tensor<type, 1>& y)
167{
168#ifdef OPENNN_DEBUG
169
170 ostringstream buffer;
171
172 if(x.size() != y.size())
173 {
174 buffer << "OpenNN Exception: Vector Template.\n"
175 << "Correlation "
176 "exponential_correlation(const Tensor<type, 1>&, const Tensor<type, 1>&) const method.\n"
177 << "Y size must be equal to X size.\n";
178
179 throw logic_error(buffer.str());
180 }
181
182#endif
183
184 // Check negative values from y
185
186 Correlation exponential_correlation;
187
188 for(Index i = 0; i < y.dimension(0); i++)
189 {
190 if(!isnan(y(i)) && y(i) <= type(0))
191 {
192 exponential_correlation.r = type(NAN);
193
194 return exponential_correlation;
195 }
196 }
197
198 exponential_correlation = linear_correlation(thread_pool_device, x, y.log());
199
200 exponential_correlation.correlation_type = CorrelationMethod::Exponential;
201
202 exponential_correlation.a = exp(exponential_correlation.a);
203 exponential_correlation.b = exponential_correlation.b;
204
205 return exponential_correlation;
206}
207
208
212
213Correlation power_correlation(const ThreadPoolDevice* thread_pool_device, const Tensor<type, 1>& x, const Tensor<type, 1>& y)
214{
215#ifdef OPENNN_DEBUG
216
217 ostringstream buffer;
218
219 if(x.size() != y.size())
220 {
221 buffer << "OpenNN Exception: Vector Template.\n"
222 << "Correlation "
223 "power_correlation(const Tensor<type, 1>&) const "
224 "method.\n"
225 << "Y size must be equal to X size.\n";
226
227 throw logic_error(buffer.str());
228 }
229
230#endif
231
232 // Check negative values from x and y
233
234 Correlation power_correlation;
235
236 for(Index i = 0; i < x.dimension(0); i++)
237 {
238 if(!isnan(x(i)) && x(i) <= type(0))
239 {
240 power_correlation.r = type(NAN);
241
242 return power_correlation;
243 }
244
245 if(!isnan(y(i)) && y(i) <= type(0))
246 {
247 power_correlation.r = type(NAN);
248
249 return power_correlation;
250 }
251 }
252
253 power_correlation = linear_correlation(thread_pool_device, x.log(), y.log());
254
255 power_correlation.correlation_type = CorrelationMethod::Power;
256
257 power_correlation.a = exp(power_correlation.a);
258
259 return power_correlation;
260}
261
262
266
267Correlation logistic_correlation_vector_vector(const ThreadPoolDevice* thread_pool_device, const Tensor<type, 1>& x, const Tensor<type, 1>& y)
268{
269 Correlation correlation;
270
271 const Tensor<type, 2> data = assemble_vector_vector(x, y);
272
273 DataSet data_set(data);
274 data_set.set_training();
275
276 data_set.set_columns_scalers(Scaler::MinimumMaximum);
277
278 NeuralNetwork neural_network(NeuralNetwork::ProjectType::Classification, {1,1});
279
280 neural_network.get_probabilistic_layer_pointer()->set_activation_function(ProbabilisticLayer::ActivationFunction::Logistic);
281
282 TrainingStrategy training_strategy(&neural_network, &data_set);
283 training_strategy.set_display(false);
284 training_strategy.set_display_period(1);
285
286 training_strategy.set_loss_method(TrainingStrategy::LossMethod::NORMALIZED_SQUARED_ERROR);
287 training_strategy.get_loss_index_pointer()->set_regularization_method(LossIndex::RegularizationMethod::NoRegularization);
288
289 training_strategy.set_optimization_method(TrainingStrategy::OptimizationMethod::LEVENBERG_MARQUARDT_ALGORITHM);
290
291 training_strategy.perform_training();
292
293 const Tensor<type, 2> inputs = data_set.get_input_data();
294 const Tensor<type, 2> targets = data_set.get_target_data();
295 const Tensor<type, 2> outputs = neural_network.calculate_outputs(inputs);
296
297 // Logistic correlation
298
299 const Eigen::array<Index, 1> vector{{x.size()}};
300
301 correlation.r = linear_correlation(thread_pool_device, outputs.reshape(vector), targets.reshape(vector)).r;
302
303 correlation.correlation_type = CorrelationMethod::Logistic;
304
305 const Tensor<type, 1> coefficients = neural_network.get_parameters();
306
307 correlation.a = coefficients(0);
308 correlation.b = coefficients(1);
309
310 if(correlation.b < type(0)) correlation.r *= type(-1);
311
312 return correlation;
313}
314
315
316Correlation logistic_correlation_vector_matrix(const ThreadPoolDevice* thread_pool_device,
317 const Tensor<type, 1>& x,
318 const Tensor<type, 2>& y)
319{
320 Correlation correlation;
321
322 const Tensor<type, 2> data = OpenNN::assemble_vector_matrix(x, y);
323
324 Tensor<Index, 1> input_columns_indices(1);
325 input_columns_indices(0) = 0;
326
327 Tensor<Index, 1> target_columns_indices(y.dimension(1));
328 for(Index i = 0; i < y.dimension(1); i++) target_columns_indices(i) = 1+i;
329
330 DataSet data_set(data);
331
332 data_set.set_input_target_columns(input_columns_indices, target_columns_indices);
333
334 data_set.set_training();
335
336 const Index input_variables_number = data_set.get_input_variables_number();
337 const Index target_variables_number = data_set.get_target_variables_number();
338
339 NeuralNetwork neural_network(NeuralNetwork::ProjectType::Classification, {input_variables_number, target_variables_number});
340 neural_network.get_probabilistic_layer_pointer()->set_activation_function(ProbabilisticLayer::ActivationFunction::Logistic);
341
342 TrainingStrategy training_strategy(&neural_network, &data_set);
343
344 training_strategy.get_loss_index_pointer()->set_regularization_method(LossIndex::RegularizationMethod::NoRegularization);
345
346 training_strategy.set_optimization_method(TrainingStrategy::OptimizationMethod::LEVENBERG_MARQUARDT_ALGORITHM);
347
348 training_strategy.set_display(false);
349
350 training_strategy.perform_training();
351
352 // Logistic correlation
353
354 const Tensor<type, 2> inputs = data_set.get_input_data();
355 const Tensor<type, 2> targets = data_set.get_target_data();
356 const Tensor<type, 2> outputs = neural_network.calculate_outputs(inputs);
357
358 const Eigen::array<Index, 1> vector{{targets.size()}};
359
360 correlation.r = linear_correlation(thread_pool_device, outputs.reshape(vector), targets.reshape(vector)).r;
361
362 correlation.correlation_type = CorrelationMethod::Logistic;
363
364 return correlation;
365}
366
367
368Correlation logistic_correlation_matrix_vector(const ThreadPoolDevice* thread_pool_device,
369 const Tensor<type, 2>& x, const Tensor<type, 1>& y)
370{
371 return OpenNN::logistic_correlation_vector_matrix(thread_pool_device, y, x);
372}
373
374
375Correlation logistic_correlation_matrix_matrix(const ThreadPoolDevice* thread_pool_device, const Tensor<type, 2>& x, const Tensor<type, 2>& y)
376{
377 Correlation correlation;
378
379 const Tensor<type, 2> data = OpenNN::assemble_matrix_matrix(x, y);
380
381 Tensor<Index, 1> input_columns_indices(1);
382 input_columns_indices(0) = 0;
383
384 Tensor<Index, 1> target_columns_indices(y.dimension(1));
385 for(Index i = 0; i < y.dimension(1); i++) target_columns_indices(i) = 1+i;
386
387 DataSet data_set(data);
388
389 data_set.set_input_target_columns(input_columns_indices, target_columns_indices);
390
391 data_set.set_training();
392
393 const Index input_variables_number = data_set.get_input_variables_number();
394 const Index target_variables_number = data_set.get_target_variables_number();
395
396 NeuralNetwork neural_network(NeuralNetwork::ProjectType::Classification, {input_variables_number, target_variables_number});
397 neural_network.get_probabilistic_layer_pointer()->set_activation_function(ProbabilisticLayer::ActivationFunction::Logistic);
398
399 TrainingStrategy training_strategy(&neural_network, &data_set);
400
401 training_strategy.get_loss_index_pointer()->set_regularization_method(LossIndex::RegularizationMethod::NoRegularization);
402
403 training_strategy.set_optimization_method(TrainingStrategy::OptimizationMethod::LEVENBERG_MARQUARDT_ALGORITHM);
404
405 training_strategy.set_display(false);
406
407 training_strategy.perform_training();
408
409 // Logistic correlation
410
411 const Tensor<type, 2> inputs = data_set.get_input_data();
412 const Tensor<type, 2> targets = data_set.get_target_data();
413 const Tensor<type, 2> outputs = neural_network.calculate_outputs(inputs);
414
415 const Eigen::array<Index, 1> vector{{targets.size()}};
416
417 correlation.r = linear_correlation(thread_pool_device, outputs.reshape(vector), targets.reshape(vector)).r;
418
419 correlation.correlation_type = CorrelationMethod::Logistic;
420
421 return correlation;
422}
423
424
425Correlation correlation(const ThreadPoolDevice* thread_pool_device, const Tensor<type, 2>& x, const Tensor<type, 2>& y)
426{
427 Correlation correlation;
428
429 const Index x_rows = x.dimension(0);
430 const Index x_columns = x.dimension(1);
431 const Index y_columns = y.dimension(1);
432
433 const bool x_binary = is_binary(x);
434 const bool y_binary = is_binary(y);
435
436 const Eigen::array<Index, 1> vector{{x_rows}};
437
438 if(x_columns == 1 && y_columns == 1)
439 {
440 if(!x_binary && !y_binary)
441 {
442 const Correlation linear_correlation
443 = OpenNN::linear_correlation(thread_pool_device, x.reshape(vector), y.reshape(vector));
444
445 const Correlation exponential_correlation
446 = OpenNN::exponential_correlation(thread_pool_device, x.reshape(vector), y.reshape(vector));
447
448 const Correlation logarithmic_correlation
449 = OpenNN::logarithmic_correlation(thread_pool_device, x.reshape(vector), y.reshape(vector));
450
451 const Correlation power_correlation
452 = OpenNN::power_correlation(thread_pool_device, x.reshape(vector), y.reshape(vector));
453
454 Correlation strongest_correlation = linear_correlation;
455
456 if(abs(exponential_correlation.r) > abs(strongest_correlation.r))
457 strongest_correlation = exponential_correlation;
458
459 if(abs(logarithmic_correlation.r) > abs(strongest_correlation.r))
460 strongest_correlation = logarithmic_correlation;
461
462 if(abs(power_correlation.r) > abs(strongest_correlation.r))
463 strongest_correlation = power_correlation;
464
465 return strongest_correlation;
466 }
467 else if(!x_binary && y_binary)
468 {
469 return OpenNN::logistic_correlation_vector_vector(thread_pool_device, x.reshape(vector), y.reshape(vector));
470 }
471 else if(x_binary && !y_binary)
472 {
473 return OpenNN::logistic_correlation_vector_vector(thread_pool_device, y.reshape(vector), x.reshape(vector));
474 }
475 else if(x_binary && y_binary)
476 {
477 return OpenNN::linear_correlation(thread_pool_device, x.reshape(vector), y.reshape(vector));
478 }
479 }
480 else if(x_columns != 1 && y_columns == 1)
481 {
482 return OpenNN::logistic_correlation_matrix_vector(thread_pool_device, x, y.reshape(vector));
483 }
484 else if(x_columns == 1 && y_columns != 1)
485 {
486 return OpenNN::logistic_correlation_vector_matrix(thread_pool_device, x.reshape(vector), y);
487 }
488 else if(x_columns != 1 && y_columns != 1)
489 {
490 return OpenNN::logistic_correlation_matrix_matrix(thread_pool_device, x, y);
491 }
492 else
493 {
494 throw logic_error("Correlations Exception: Unknown case.");
495 }
496
497 return correlation;
498}
499
500
502
503pair<Tensor<type, 1>, Tensor<type, 1>> filter_missing_values_vector_vector(const Tensor<type, 1>& x, const Tensor<type, 1>& y)
504{
505 Index new_size = 0;
506
507 for(Index i = 0; i < x.size(); i++)
508 {
509 if(!isnan(x(i)) && !isnan(y(i))) new_size++;
510 }
511
512 if(new_size == x.size())
513 {
514 return make_pair(x, y);
515 }
516
517 Tensor<type, 1> new_x(new_size);
518
519 Tensor<type, 1> new_y(new_size);
520
521 Index index = 0;
522
523 for(Index i = 0; i < x.size(); i++)
524 {
525 if(!isnan(x(i)) && !isnan(y(i)))
526 {
527 new_x(index) = x(i);
528 new_y(index) = y(i);
529
530 index++;
531 }
532 }
533
534 return make_pair(new_x, new_y);
535}
536
537
538pair<Tensor<type, 2>, Tensor<type, 2>> filter_missing_values_matrix_matrix(const Tensor<type, 2>& x, const Tensor<type, 2>& y)
539{
540 const Index rows_number = x.dimension(0);
541 const Index x_columns_number = x.dimension(1);
542 const Index y_columns_number = y.dimension(1);
543
544 Index new_rows_number = 0;
545
546 Tensor<bool, 1> not_NAN_row(rows_number);
547
548 for(Index i = 0; i < rows_number; i++)
549 {
550 not_NAN_row(i) = true;
551
552 if(float(isnan(y(i))))
553 {
554 not_NAN_row(i) = false;
555 }
556 else
557 {
558 for(Index j = 0; j < x_columns_number; j++)
559 {
560 if(float(isnan(x(i,j))))
561 {
562 not_NAN_row(i) = false;
563 break;
564 }
565 }
566 }
567
568 if(not_NAN_row(i)) new_rows_number++;
569 }
570
571 Tensor<type, 2> new_x(new_rows_number, x_columns_number);
572
573 Tensor<type, 2> new_y(new_rows_number,y_columns_number);
574
575 Index index = 0;
576
577 for(Index i = 0; i < rows_number; i++)
578 {
579 if(not_NAN_row(i))
580 {
581 for(Index j = 0; j < y_columns_number; j++)
582 {
583 new_y(index, j) = y(i,j);
584 }
585
586 for(Index j = 0; j < x_columns_number; j++)
587 {
588 new_x(index, j) = x(i, j);
589 }
590
591 index++;
592 }
593 }
594
595 return make_pair(new_x, new_y);
596}
597
598
602
603Tensor<type, 1> autocorrelations(const ThreadPoolDevice* thread_pool_device, const Tensor<type, 1>& x, const Index& lags_number)
604{
605 Tensor<type, 1> autocorrelation(lags_number);
606
607 const Index this_size = x.size();
608
609 for(Index i = 0; i < lags_number; i++)
610 {
611 Tensor<type, 1> column_x(this_size-i);
612 Tensor<type, 1> column_y(this_size-i);
613
614 for(Index j = 0; j < this_size - i; j++)
615 {
616 column_x(j) = x(j);
617 column_y(j) = x(j + i);
618 }
619
620 autocorrelation(i) = linear_correlation(thread_pool_device, column_x, column_y).r;
621 }
622
623 return autocorrelation;
624}
625
626
631
632Tensor<type, 1> cross_correlations(const ThreadPoolDevice* thread_pool_device,
633 const Tensor<type, 1>& x, const Tensor<type, 1>& y, const Index& maximum_lags_number)
634{
635 if(y.size() != x.size())
636 {
637 ostringstream buffer;
638
639 buffer << "OpenNN Exception: Correlations.\n"
640 << "Tensor<type, 1> calculate_cross_correlation(const Tensor<type, 1>&) method.\n"
641 << "Both vectors must have the same size.\n";
642
643 throw logic_error(buffer.str());
644 }
645
646 Tensor<type, 1> cross_correlation(maximum_lags_number);
647
648 const Index this_size = x.size();
649
650 for(Index i = 0; i < maximum_lags_number; i++)
651 {
652 Tensor<type, 1> column_x(this_size-i);
653 Tensor<type, 1> column_y(this_size-i);
654
655 for(Index j = 0; j < this_size - i; j++)
656 {
657 column_x(j) = x(j);
658 column_y(j) = y(j + i);
659 }
660
661 cross_correlation[i] = linear_correlation(thread_pool_device, column_x, column_y).r;
662 }
663
664 return cross_correlation;
665}
666
667
668Tensor<type, 2> get_correlation_values(const Tensor<Correlation, 2>& correlations)
669{
670 const Index rows_number = correlations.dimension(0);
671 const Index columns_number = correlations.dimension(1);
672
673 Tensor<type, 2> values(rows_number, columns_number);
674
675 for(Index i = 0; i < rows_number; i++)
676 {
677 for(Index j = 0; j < columns_number; j++)
678 {
679 values(i,j) = correlations(i,j).r;
680 }
681 }
682
683 return values;
684}
685
686}
687
688// OpenNN: Open Neural Networks Library.
689// Copyright(C) 2005-2021 Artificial Intelligence Techniques, SL.
690//
691// This library is free software; you can redistribute it and/or
692// modify it under the terms of the GNU Lesser General Public
693// License as published by the Free Software Foundation; either
694// version 2.1 of the License, or any later version.
695//
696// This library is distributed in the hope that it will be useful,
697// but WITHOUT ANY WARRANTY; without even the implied warranty of
698// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
699// Lesser General Public License for more details.
700
701// You should have received a copy of the GNU Lesser General Public
702// License along with this library; if not, write to the Free Software
703// Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
// --- Extraction residue: Doxygen cross-reference index, preserved as comments ---
// uint32 sqrt(uint32 &r, int &exp)        — defined in half.hpp:1480
// HALF_CONSTEXPR half abs(half arg)       — defined in half.hpp:2735
// HALF_CONSTEXPR bool isnan(half arg)     — defined in half.hpp:4385
// half exp(half arg)                      — defined in half.hpp:2936
// type a                  — Independent coefficient of the logistic function (correlations.h:70)
// CorrelationMethod correlation_type — Regression method type (correlations.h:82)
// type r                  — Correlation coefficient of the regression (correlations.h:78)
// type b                  — x coefficient of the logistic function (correlations.h:74)