9#include "adaptive_moment_estimation.h"
146 if(new_maximum_epochs_number <
static_cast<type
>(0.0))
148 ostringstream buffer;
150 buffer <<
"OpenNN Exception: AdaptiveMomentEstimation class.\n"
151 <<
"void set_maximum_epochs_number(const type&) method.\n"
152 <<
"Maximum epochs number must be equal or greater than 0.\n";
154 throw logic_error(buffer.str());
182 if(new_maximum_time <
static_cast<type
>(0.0))
184 ostringstream buffer;
186 buffer <<
"OpenNN Exception: AdaptiveMomentEstimation class.\n"
187 <<
"void set_maximum_time(const type&) method.\n"
188 <<
"Maximum time must be equal or greater than 0.\n";
190 throw logic_error(buffer.str());
214 if(
display) cout <<
"Training with adaptive moment estimation \"Adam\" ...\n";
220 const bool has_selection = data_set_pointer->has_selection();
231 const Tensor<Scaler, 1> input_variables_scalers = data_set_pointer->get_input_variables_scalers();
232 const Tensor<Scaler, 1> target_variables_scalers = data_set_pointer->get_target_variables_scalers();
234 const Tensor<Descriptives, 1> input_variables_descriptives = data_set_pointer->
scale_input_variables();
235 Tensor<Descriptives, 1> target_variables_descriptives;
237 Index batch_size_training = 0;
238 Index batch_size_selection = 0;
244 ? batch_size_training = training_samples_number
248 ? batch_size_selection = selection_samples_number
251 DataSetBatch batch_training(batch_size_training, data_set_pointer);
252 DataSetBatch batch_selection(batch_size_selection, data_set_pointer);
254 const Index training_batches_number = training_samples_number/batch_size_training;
255 const Index selection_batches_number = selection_samples_number/batch_size_selection;
257 Tensor<Index, 2> training_batches(training_batches_number, batch_size_training);
258 Tensor<Index, 2> selection_batches(selection_batches_number, batch_size_selection);
270 scaling_layer_pointer->
set(input_variables_descriptives, input_variables_scalers);
278 unscaling_layer_pointer->
set(target_variables_descriptives, target_variables_scalers);
291 type training_error = type(0);
292 type training_loss = type(0);
294 type selection_error = type(0);
296 Index selection_failures = 0;
302 bool stop_training =
false;
304 time_t beginning_time, current_time;
305 time(&beginning_time);
306 type elapsed_time = type(0);
308 bool shuffle =
false;
320 training_batches = data_set_pointer->
get_batches(training_samples_indices, batch_size_training, shuffle);
322 const Index batches_number = training_batches.dimension(0);
324 training_loss = type(0);
325 training_error = type(0);
327 optimization_data.iteration = 1;
329 for(Index iteration = 0; iteration < batches_number; iteration++)
333 batch_training.fill(training_batches.chip(iteration, 0), input_variables_indices, target_variables_indices);
337 neural_network_pointer->
forward_propagate(batch_training, training_forward_propagation);
341 loss_index_pointer->back_propagate(batch_training, training_forward_propagation, training_back_propagation);
343 training_error += training_back_propagation.error;
344 training_loss += training_back_propagation.loss;
351 training_loss /=
static_cast<type
>(batches_number);
352 training_error /=
static_cast<type
>(batches_number);
358 selection_batches = data_set_pointer->
get_batches(selection_samples_indices, batch_size_selection, shuffle);
360 selection_error = type(0);
362 for(Index iteration = 0; iteration < selection_batches_number; iteration++)
366 batch_selection.fill(selection_batches.chip(iteration,0), input_variables_indices, target_variables_indices);
370 neural_network_pointer->
forward_propagate(batch_selection, selection_forward_propagation);
374 loss_index_pointer->calculate_errors(batch_selection, selection_forward_propagation, selection_back_propagation);
376 loss_index_pointer->calculate_error(batch_selection, selection_forward_propagation, selection_back_propagation);
378 selection_error += selection_back_propagation.error;
381 selection_error /=
static_cast<type
>(selection_batches_number);
391 elapsed_time =
static_cast<type
>(difftime(current_time, beginning_time));
395 cout <<
"Training error: " << training_error << endl;
396 if(has_selection) cout <<
"Selection error: " << selection_error << endl;
397 cout <<
"Elapsed time: " <<
write_time(elapsed_time) << endl;
404 if(
display) cout <<
"Epoch " << epoch << endl <<
"Maximum number of epochs reached: " << epoch << endl;
406 stop_training =
true;
413 if(
display) cout <<
"Epoch " << epoch << endl <<
"Maximum training time reached: " <<
write_time(elapsed_time) << endl;
415 stop_training =
true;
422 if(
display) cout <<
"Epoch " << epoch << endl <<
"Loss goal reached: " << training_loss << endl;
424 stop_training =
true;
431 if(
display) cout <<
"Epoch " << epoch << endl <<
"Maximum selection failures reached: " << selection_failures << endl;
433 stop_training =
true;
466 return "ADAPTIVE_MOMENT_ESTIMATION";
474 Tensor<string, 2> labels_values(9, 2);
478 labels_values(0,0) =
"Initial learning rate";
483 labels_values(1,0) =
"Initial decay";
488 labels_values(2,0) =
"Beta 1";
489 labels_values(2,1) = to_string(
double(
beta_1));
493 labels_values(3,0) =
"Beta 2";
494 labels_values(3,1) = to_string(
double(
beta_2));
498 labels_values(4,0) =
"Epsilon";
499 labels_values(4,1) = to_string(
double(
epsilon));
503 labels_values(5,0) =
"Training loss goal";
508 labels_values(6,0) =
"Maximum epochs number";
513 labels_values(7,0) =
"Maximum time";
518 labels_values(8,0) =
"Batch samples number";
521 return labels_values;
530 ostringstream buffer;
532 file_stream.OpenElement(
"AdaptiveMomentEstimation");
536 file_stream.OpenElement(
"BatchSize");
541 file_stream.
PushText(buffer.str().c_str());
547 file_stream.OpenElement(
"LossGoal");
552 file_stream.
PushText(buffer.str().c_str());
558 file_stream.OpenElement(
"MaximumEpochsNumber");
563 file_stream.
PushText(buffer.str().c_str());
569 file_stream.OpenElement(
"MaximumTime");
574 file_stream.
PushText(buffer.str().c_str());
580 file_stream.OpenElement(
"HardwareUse");
585 file_stream.
PushText(buffer.str().c_str());
597 const tinyxml2::XMLElement* root_element = document.FirstChildElement(
"AdaptiveMomentEstimation");
601 ostringstream buffer;
603 buffer <<
"OpenNN Exception: AdaptiveMomentEstimation class.\n"
604 <<
"void from_XML(const tinyxml2::XMLDocument&) method.\n"
605 <<
"Adaptive moment estimation element is nullptr.\n";
607 throw logic_error(buffer.str());
614 if(batch_size_element)
616 const Index new_batch_size =
static_cast<Index
>(atoi(batch_size_element->GetText()));
622 catch(
const logic_error& e)
624 cerr << e.what() << endl;
634 const type new_loss_goal =
static_cast<type
>(atof(element->GetText()));
640 catch(
const logic_error& e)
642 cerr << e.what() << endl;
653 const Index new_maximum_epochs_number =
static_cast<Index
>(atoi(element->GetText()));
659 catch(
const logic_error& e)
661 cerr << e.what() << endl;
672 const type new_maximum_time =
static_cast<type
>(atof(element->GetText()));
678 catch(
const logic_error& e)
680 cerr << e.what() << endl;
691 const string new_hardware_use = element->GetText();
697 catch(
const logic_error& e)
699 cerr << e.what() << endl;
720Index AdaptiveMomentEstimation::get_batch_samples_number()
const
731 const type learning_rate =
733 sqrt(type(1) -
pow(
beta_2,
static_cast<type
>(optimization_data.iteration)))/
734 (type(1) -
pow(
beta_1,
static_cast<type
>(optimization_data.iteration))));
736 optimization_data.gradient_exponential_decay.device(*thread_pool_device)
737 = optimization_data.gradient_exponential_decay*
beta_1
738 + back_propagation.gradient*(type(1) -
beta_1);
740 optimization_data.square_gradient_exponential_decay.device(*thread_pool_device)
741 = optimization_data.square_gradient_exponential_decay*
beta_2
742 + back_propagation.gradient*back_propagation.gradient*(type(1) -
beta_2);
744 back_propagation.parameters.device(*thread_pool_device) -=
745 optimization_data.gradient_exponential_decay*learning_rate/(optimization_data.square_gradient_exponential_decay.sqrt() +
epsilon);
747 optimization_data.iteration++;
762 set(new_stochastic_gradient_descent_pointer);
766AdaptiveMomentEstimationData::~AdaptiveMomentEstimationData()
771void AdaptiveMomentEstimationData::set(AdaptiveMomentEstimation* new_adaptive_moment_estimation_pointer)
773 adaptive_moment_estimation_pointer = new_adaptive_moment_estimation_pointer;
781 gradient_exponential_decay.resize(parameters_number);
782 gradient_exponential_decay.setZero();
784 square_gradient_exponential_decay.resize(parameters_number);
785 square_gradient_exponential_decay.setZero();
789void AdaptiveMomentEstimationData::print()
const
791 cout <<
"Gradient exponential decay:" << endl
792 <<gradient_exponential_decay << endl;
794 cout <<
"Square gradient exponential decay:" << endl
795 << square_gradient_exponential_decay << endl;
TrainingResults perform_training()
const type & get_epsilon() const
Returns epsilon.
void set_loss_index_pointer(LossIndex *)
const type & get_maximum_time() const
Returns the maximum training time.
const type & get_beta_2() const
Returns beta 2.
const type & get_loss_goal() const
void from_XML(const tinyxml2::XMLDocument &)
void set_default()
Sets the members of the optimization algorithm object to their default values.
AdaptiveMomentEstimation()
type initial_learning_rate
Initial learning rate.
const type & get_beta_1() const
Returns beta 1.
void set_epsilon(const type &)
Tensor< string, 2 > to_string_matrix() const
Writes the most representative attributes as a matrix of strings.
type beta_1
Exponential decay over gradient estimates.
string write_optimization_algorithm_type() const
Returns the name of the optimization algorithm.
void set_initial_learning_rate(const type &)
void set_maximum_time(const type &)
void set_loss_goal(const type &)
type epsilon
Small number to prevent any division by zero.
void set_beta_2(const type &)
void set_batch_samples_number(const Index &new_batch_samples_number)
Sets the number of samples in each batch. The default is 1000.
type maximum_time
Maximum training time. It is used as a stopping criterion.
void set_maximum_epochs_number(const Index &)
void update_parameters(LossIndexBackPropagation &, AdaptiveMomentEstimationData &)
Update iteration parameters.
type initial_decay
Learning rate decay over each update.
type training_loss_goal
Goal value for the loss. It is used as a stopping criterion.
virtual ~AdaptiveMomentEstimation()
Destructor.
Index maximum_epochs_number
Maximum epochs number.
void write_XML(tinyxml2::XMLPrinter &) const
Index batch_samples_number
Training and selection batch size.
Index maximum_selection_failures
Maximum number of times the selection error is allowed to increase.
void set_beta_1(const type &)
const type & get_initial_learning_rate() const
Returns the initial learning rate.
type beta_2
Exponential decay over square gradient estimates.
This class represents the concept of data set for data modelling problems, such as approximation,...
Index get_training_samples_number() const
Returns the number of samples in the data set which will be used for training.
Tensor< Descriptives, 1 > scale_target_variables()
Tensor< Index, 1 > get_training_samples_indices() const
Returns the indices of the samples which will be used for training.
Tensor< Index, 1 > get_selection_samples_indices() const
Returns the indices of the samples which will be used for selection.
void unscale_input_variables(const Tensor< Descriptives, 1 > &)
Tensor< Index, 1 > get_target_variables_indices() const
Returns the indices of the target variables.
Index get_selection_samples_number() const
Returns the number of samples in the data set which will be used for selection.
void unscale_target_variables(const Tensor< Descriptives, 1 > &)
Tensor< string, 1 > get_target_variables_names() const
Tensor< Index, 1 > get_input_variables_indices() const
Returns the indices of the input variables.
Tensor< string, 1 > get_input_variables_names() const
Tensor< Index, 2 > get_batches(const Tensor< Index, 1 > &, const Index &, const bool &, const Index &buffer_size=100) const
Tensor< Descriptives, 1 > scale_input_variables()
This abstract class represents the concept of loss index composed of an error term and a regularizati...
NeuralNetwork * get_neural_network_pointer() const
Returns a pointer to the neural network object associated to the error term.
DataSet * get_data_set_pointer() const
Returns a pointer to the data set object associated to the error term.
ScalingLayer * get_scaling_layer_pointer() const
Returns a pointer to the scaling layers object composing this neural network object.
bool has_long_short_term_memory_layer() const
bool has_scaling_layer() const
bool has_unscaling_layer() const
bool has_recurrent_layer() const
void forward_propagate(const DataSetBatch &, NeuralNetworkForwardPropagation &) const
Calculate forward propagation in neural network.
void save(const string &) const
void set_parameters(Tensor< type, 1 > &)
UnscalingLayer * get_unscaling_layer_pointer() const
Returns a pointer to the unscaling layers object composing this neural network object.
void set_inputs_names(const Tensor< string, 1 > &)
Index get_parameters_number() const
void set_outputs_names(const Tensor< string, 1 > &)
string neural_network_file_name
Path where the neural network is saved.
void set_hardware_use(const string &)
Set hardware to use. Default: Multi-core.
string get_hardware_use() const
Hardware use.
LossIndex * loss_index_pointer
Pointer to a loss index for a neural network object.
virtual void check() const
bool display
Display messages to screen.
const string write_time(const type &) const
Writes the time from seconds in format HH:mm:ss.
Index save_period
Number of iterations between the training saving progress.
LossIndex * get_loss_index_pointer() const
Index display_period
Number of iterations between the training showing progress.
This class represents a layer of scaling neurons.
void set()
Sets the scaling layer to be empty.
This class represents a layer of unscaling neurons.
void set()
Sets the unscaling layer to be empty.
void PushText(const char *text, bool cdata=false)
Add a text node.
virtual void CloseElement(bool compactMode=false)
If streaming, close the Element.
AdaptiveMomentEstimationData()
Default constructor.
This structure contains the optimization algorithm results.
Tensor< type, 1 > selection_error_history
History of the selection error over the training iterations.
void resize_training_error_history(const Index &)
Resizes the training error history keeping the values.
OptimizationAlgorithm::StoppingCondition stopping_condition
Stopping condition of the algorithm.
void resize_selection_error_history(const Index &)
Resizes the selection error history keeping the values.
Tensor< type, 1 > training_error_history
History of the loss function value over the training iterations.
string elapsed_time
Elapsed time of the training process.