n2p2 - A neural network potential package
Training.cpp
// n2p2 - A neural network potential package
// Copyright (C) 2018 Andreas Singraber (University of Vienna)
//
// This program is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program. If not, see <https://www.gnu.org/licenses/>.

#include "Training.h"
#include "GradientDescent.h"
#include "KalmanFilter.h"
#include "NeuralNetwork.h"
#include "utility.h"
#include "mpi-extra.h"
#ifdef _OPENMP
#include <omp.h>
#endif
#include <algorithm> // std::sort, std::fill, std::find
#include <cmath>     // fabs
#include <cstdlib>   // atoi
#include <gsl/gsl_rng.h>
#include <limits>    // std::numeric_limits
#include <stdexcept> // std::runtime_error, std::range_error
#include <utility>   // std::piecewise_construct, std::forward_as_tuple

using namespace std;
using namespace nnp;
Training::Training() : Dataset(),
                       updaterType                (UT_GD          ),
                       parallelMode               (PM_TRAIN_RK0   ),
                       jacobianMode               (JM_SUM         ),
                       updateStrategy             (US_COMBINED    ),
                       hasUpdaters                (false          ),
                       hasStructures              (false          ),
                       useForces                  (false          ),
                       repeatedEnergyUpdates      (false          ),
                       freeMemory                 (false          ),
                       writeTrainingLog           (false          ),
                       stage                      (0              ),
                       numUpdaters                (0              ),
                       numEpochs                  (0              ),
                       epoch                      (0              ),
                       writeWeightsEvery          (0              ),
                       writeWeightsAlways         (0              ),
                       writeNeuronStatisticsEvery (0              ),
                       writeNeuronStatisticsAlways(0              ),
                       numWeights                 (0              ),
                       forceWeight                (0.0            ),
                       trainingLogFileName        ("train-log.out")
{
    sw["setup"].start();
}

Training::~Training()
{
    for (vector<Updater*>::iterator it = updaters.begin();
         it != updaters.end(); ++it)
    {
        if (updaterType == UT_GD)
        {
            delete dynamic_cast<GradientDescent*>(*it);
        }
        else if (updaterType == UT_KF)
        {
            delete dynamic_cast<KalmanFilter*>(*it);
        }
    }

    if (trainingLog.is_open()) trainingLog.close();
}

void Training::selectSets()
{
    log << "\n";
    log << "*** DEFINE TRAINING/TEST SETS ***********"
           "**************************************\n";
    log << "\n";

    vector<string> pCheck = {"force", "charge"};
    bool check = false;
    for (auto k : pk)
    {
        check |= (find(pCheck.begin(), pCheck.end(), k) != pCheck.end());
    }
    vector<size_t> numAtomsPerElement(numElements, 0);

    double testSetFraction = atof(settings["test_fraction"].c_str());
    log << strpr("Desired test set ratio      : %f\n", testSetFraction);
    if (structures.size() > 0) hasStructures = true;
    else hasStructures = false;

    string k;
    for (size_t i = 0; i < structures.size(); ++i)
    {
        Structure& s = structures.at(i);
        // Only select set if not already determined.
        if (s.sampleType == Structure::ST_UNKNOWN)
        {
            double const r = gsl_rng_uniform(rng);
            if (r < testSetFraction) s.sampleType = Structure::ST_TEST;
            else s.sampleType = Structure::ST_TRAINING;
        }
        if (s.sampleType == Structure::ST_TEST)
        {
            size_t const& na = s.numAtoms;
            k = "energy"; if (p.exists(k)) p[k].numTestPatterns++;
            k = "force";  if (p.exists(k)) p[k].numTestPatterns += 3 * na;
            k = "charge"; if (p.exists(k)) p[k].numTestPatterns += na;
        }
        else if (s.sampleType == Structure::ST_TRAINING)
        {
            for (size_t j = 0; j < numElements; ++j)
            {
                numAtomsPerElement.at(j) += s.numAtomsPerElement.at(j);
            }

            k = "energy";
            if (p.exists(k))
            {
                p[k].numTrainPatterns++;
                p[k].updateCandidates.push_back(UpdateCandidate());
                p[k].updateCandidates.back().s = i;
            }
            k = "force";
            if (p.exists(k))
            {
                p[k].numTrainPatterns += 3 * s.numAtoms;
                for (vector<Atom>::const_iterator it = s.atoms.begin();
                     it != s.atoms.end(); ++it)
                {
                    for (size_t j = 0; j < 3; ++j)
                    {
                        p[k].updateCandidates.push_back(UpdateCandidate());
                        p[k].updateCandidates.back().s = i;
                        p[k].updateCandidates.back().a = it->index;
                        p[k].updateCandidates.back().c = j;
                    }
                }
            }
            k = "charge";
            if (p.exists(k))
            {
                p[k].numTrainPatterns += s.numAtoms;
                for (vector<Atom>::const_iterator it = s.atoms.begin();
                     it != s.atoms.end(); ++it)
                {
                    p[k].updateCandidates.push_back(UpdateCandidate());
                    p[k].updateCandidates.back().s = i;
                    p[k].updateCandidates.back().a = it->index;
                }
            }
        }
        else
        {
            log << strpr("WARNING: Structure %zu not assigned to either "
                         "training or test set.\n", s.index);
        }
    }
    for (size_t i = 0; i < numElements; ++i)
    {
        if (hasStructures && (numAtomsPerElement.at(i) == 0))
        {
            log << strpr("WARNING: Process %d has no atoms of element "
                         "%zu (%2s).\n",
                         myRank,
                         i,
                         elementMap[i].c_str());
        }
    }
    for (auto k : pk)
    {
        MPI_Allreduce(MPI_IN_PLACE, &(p[k].numTrainPatterns), 1, MPI_SIZE_T, MPI_SUM, comm);
        MPI_Allreduce(MPI_IN_PLACE, &(p[k].numTestPatterns) , 1, MPI_SIZE_T, MPI_SUM, comm);
        double sum = p[k].numTrainPatterns + p[k].numTestPatterns;
        log << "Training/test split of data set for property \"" + k + "\":\n";
        log << strpr("- Total patterns    : %.0f\n", sum);
        log << strpr("- Training patterns : %zu\n", p[k].numTrainPatterns);
        log << strpr("- Test patterns     : %zu\n", p[k].numTestPatterns);
        log << strpr("- Test set fraction : %f\n", p[k].numTestPatterns / sum);
    }

    log << "*****************************************"
           "**************************************\n";

    return;
}

void Training::writeSetsToFiles()
{
    log << "\n";
    log << "*** WRITE TRAINING/TEST SETS ************"
           "**************************************\n";
    log << "\n";

    string fileName = strpr("train.data.%04d", myRank);
    ofstream fileTrain;
    fileTrain.open(fileName.c_str());
    if (!fileTrain.is_open())
    {
        throw runtime_error(strpr("ERROR: Could not open file %s\n",
                                  fileName.c_str()));
    }
    fileName = strpr("test.data.%04d", myRank);
    ofstream fileTest;
    fileTest.open(fileName.c_str());
    if (!fileTest.is_open())
    {
        throw runtime_error(strpr("ERROR: Could not open file %s\n",
                                  fileName.c_str()));
    }
    for (vector<Structure>::iterator it = structures.begin();
         it != structures.end(); ++it)
    {
        // Energy offsets are already subtracted at this point.
        // Here, we quickly add them again to provide consistent data sets.
        addEnergyOffset(*it);
        if (it->sampleType == Structure::ST_TRAINING)
        {
            it->writeToFile(&fileTrain);
        }
        else if (it->sampleType == Structure::ST_TEST)
        {
            it->writeToFile(&fileTest);
        }
        // Subtract energy offsets again.
        removeEnergyOffset(*it);
    }
    fileTrain.flush();
    fileTrain.close();
    fileTest.flush();
    fileTest.close();
    MPI_Barrier(comm);
    if (myRank == 0)
    {
        log << "Writing training/test set to files:\n";
        log << " - train.data\n";
        log << " - test.data\n";
        fileName = "train.data";
        combineFiles(fileName);
        fileName = "test.data";
        combineFiles(fileName);
    }

    log << "*****************************************"
           "**************************************\n";

    return;
}

void Training::initializeWeights()
{
    log << "\n";
    log << "*** WEIGHT INITIALIZATION ***************"
           "**************************************\n";
    log << "\n";

    if (settings.keywordExists("nguyen_widrow_weights_short") &&
        settings.keywordExists("precondition_weights"))
    {
        throw runtime_error("ERROR: Nguyen-Widrow and preconditioning weights"
                            " initialization are incompatible\n");
    }

    // Charge NN.
    if (nnpType == NNPType::SHORT_CHARGE_NN)
    {
        log << "Setting up charge neural networks:\n";
        if ((stage == 1 && settings.keywordExists("use_old_weights_charge")) ||
            (stage == 2))
        {
            log << "Reading old weights from files.\n";
            readNeuralNetworkWeights("charge", "weightse.%03zu.data");
        }
        else randomizeNeuralNetworkWeights("charge");
    }

    // Short-range NN.
    if (nnpType == NNPType::SHORT_ONLY)
    {
        log << "Setting up short-range neural networks:\n";
        if (settings.keywordExists("use_old_weights_short"))
        {
            log << "Reading old weights from files.\n";
            readNeuralNetworkWeights("short", "weights.%03zu.data");
        }
        else randomizeNeuralNetworkWeights("short");
    }
    else if (nnpType == NNPType::SHORT_CHARGE_NN && stage == 2)
    {
        log << "Setting up short-range neural networks:\n";
        if (settings.keywordExists("use_old_weights_short"))
        {
            log << "Reading old weights from files.\n";
            readNeuralNetworkWeights("short", "weights.%03zu.data");
        }
        else randomizeNeuralNetworkWeights("short");
    }

    log << "*****************************************"
           "**************************************\n";

    return;
}

void Training::initializeWeightsMemory(UpdateStrategy updateStrategy)
{
    this->updateStrategy = updateStrategy;
    numWeights = 0;
    if (updateStrategy == US_COMBINED)
    {
        log << strpr("Combined updater for all elements selected: "
                     "UpdateStrategy::US_COMBINED (%d)\n", updateStrategy);
        numUpdaters = 1;
        log << strpr("Number of weight updaters    : %zu\n", numUpdaters);
        for (size_t i = 0; i < numElements; ++i)
        {
            weightsOffset.push_back(numWeights);
            numWeights += elements.at(i).neuralNetworks.at(nnId)
                          .getNumConnections();
        }
        weights.resize(numUpdaters);
        weights.at(0).resize(numWeights, 0.0);
        numWeightsPerUpdater.push_back(numWeights);
        log << strpr("Total fit parameters         : %zu\n", numWeights);
    }
    else if (updateStrategy == US_ELEMENT)
    {
        log << strpr("Separate updaters for elements selected: "
                     "UpdateStrategy::US_ELEMENT (%d)\n", updateStrategy);
        numUpdaters = numElements;
        log << strpr("Number of weight updaters    : %zu\n", numUpdaters);
        weights.resize(numUpdaters);
        for (size_t i = 0; i < numUpdaters; ++i)
        {
            size_t n = elements.at(i).neuralNetworks.at(nnId)
                       .getNumConnections();
            weights.at(i).resize(n, 0.0);
            numWeightsPerUpdater.push_back(n);
            log << strpr("Fit parameters for element %2s: %zu\n",
                         elements.at(i).getSymbol().c_str(),
                         n);
        }
    }
    else
    {
        throw runtime_error("ERROR: Unknown update strategy.\n");
    }

    return;
}

void Training::setStage(size_t stage)
{
    this->stage = stage;

    // NNP of type SHORT_ONLY requires:
    // * "energy" (optionally: "force")
    if (nnpType == NNPType::SHORT_ONLY)
    {
        pk.push_back("energy");
        if (settings.keywordExists("use_short_forces")) pk.push_back("force");
    }
    // NNP of type SHORT_CHARGE_NN requires:
    // * stage 1: "charge"
    // * stage 2: "energy" (optionally: "force")
    else if (nnpType == NNPType::SHORT_CHARGE_NN)
    {
        if (stage == 1) pk.push_back("charge");
        else if (stage == 2)
        {
            pk.push_back("energy");
            if (settings.keywordExists("use_short_forces"))
            {
                pk.push_back("force");
            }
        }
    }

    // Initialize all training properties which will be used.
    auto initP = [this](string key) {p.emplace(piecewise_construct,
                                               forward_as_tuple(key),
                                               forward_as_tuple(key));
                                    };
    for (auto k : pk) initP(k);

    return;
}

void Training::dataSetNormalization()
{
    log << "\n";
    log << "*** DATA SET NORMALIZATION **************"
           "**************************************\n";
    log << "\n";

    log << "Computing statistics from reference data and initial "
           "prediction...\n";
    log << "\n";

    bool useForcesLocal = settings.keywordExists("use_short_forces");

    if (nnpType == NNPType::SHORT_CHARGE_NN && stage == 1)
    {
        throw runtime_error("ERROR: Normalization of charges not yet "
                            "implemented.\n");
    }
    writeWeights("short", "weights.%03zu.norm");
    if (nnpType == NNPType::SHORT_CHARGE_NN)
    {
        writeWeights("charge", "weightse.%03zu.norm");
    }

    ofstream fileEvsV;
    fileEvsV.open(strpr("evsv.dat.%04d", myRank).c_str());
    if (myRank == 0)
    {
        // File header.
        vector<string> title;
        vector<string> colName;
        vector<string> colInfo;
        vector<size_t> colSize;
        title.push_back("Energy vs. volume comparison.");
        colSize.push_back(16);
        colName.push_back("V_atom");
        colInfo.push_back("Volume per atom.");
        colSize.push_back(16);
        colName.push_back("Eref_atom");
        colInfo.push_back("Reference energy per atom.");
        colSize.push_back(10);
        colName.push_back("N");
        colInfo.push_back("Number of atoms.");
        colSize.push_back(16);
        colName.push_back("V");
        colInfo.push_back("Volume of structure.");
        colSize.push_back(16);
        colName.push_back("Eref");
        colInfo.push_back("Reference energy of structure.");
        colSize.push_back(16);
        colName.push_back("Eref_offset");
        colInfo.push_back("Reference energy of structure (including offset).");
        appendLinesToFile(fileEvsV,
                          createFileHeader(title, colSize, colName, colInfo));
    }

    size_t numAtomsTotal = 0;
    size_t numStructures = 0;
    double meanEnergyPerAtomRef  = 0.0;
    double meanEnergyPerAtomNnp  = 0.0;
    double sigmaEnergyPerAtomRef = 0.0;
    double sigmaEnergyPerAtomNnp = 0.0;
    double meanForceRef  = 0.0;
    double meanForceNnp  = 0.0;
    double sigmaForceRef = 0.0;
    double sigmaForceNnp = 0.0;
    for (auto& s : structures)
    {
        // File output for evsv.dat.
        fileEvsV << strpr("%16.8E %16.8E %10zu %16.8E %16.8E %16.8E\n",
                          s.volume / s.numAtoms,
                          s.energyRef / s.numAtoms,
                          s.numAtoms,
                          s.volume,
                          s.energyRef,
                          getEnergyWithOffset(s, true));
        s.calculateNeighborList(maxCutoffRadius);
#ifdef N2P2_NO_SF_GROUPS
        calculateSymmetryFunctions(s, useForcesLocal);
#else
        calculateSymmetryFunctionGroups(s, useForcesLocal);
#endif
        calculateAtomicNeuralNetworks(s, useForcesLocal);
        calculateEnergy(s);
        if (useForcesLocal) calculateForces(s);
        s.clearNeighborList();

        numStructures++;
        numAtomsTotal += s.numAtoms;
        meanEnergyPerAtomRef += s.energyRef / s.numAtoms;
        meanEnergyPerAtomNnp += s.energy    / s.numAtoms;
        for (auto& a : s.atoms)
        {
            meanForceRef += a.fRef[0] + a.fRef[1] + a.fRef[2];
            meanForceNnp += a.f   [0] + a.f   [1] + a.f   [2];
        }
    }

    fileEvsV.flush();
    fileEvsV.close();
    MPI_Barrier(MPI_COMM_WORLD);
    log << "Writing energy/atom vs. volume/atom data to \"evsv.dat\".\n";
    if (myRank == 0) combineFiles("evsv.dat");
    MPI_Allreduce(MPI_IN_PLACE, &numStructures       , 1, MPI_SIZE_T, MPI_SUM, MPI_COMM_WORLD);
    MPI_Allreduce(MPI_IN_PLACE, &numAtomsTotal       , 1, MPI_SIZE_T, MPI_SUM, MPI_COMM_WORLD);
    MPI_Allreduce(MPI_IN_PLACE, &meanEnergyPerAtomRef, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
    MPI_Allreduce(MPI_IN_PLACE, &meanEnergyPerAtomNnp, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
    MPI_Allreduce(MPI_IN_PLACE, &meanForceRef        , 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
    MPI_Allreduce(MPI_IN_PLACE, &meanForceNnp        , 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
    meanEnergyPerAtomRef /= numStructures;
    meanEnergyPerAtomNnp /= numStructures;
    meanForceRef /= 3 * numAtomsTotal;
    meanForceNnp /= 3 * numAtomsTotal;
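    // Second pass: accumulate squared deviations from the global means; the
    // sums are MPI-reduced below and converted to sample standard deviations
    // (N - 1 denominator).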
    for (auto const& s : structures)
    {
        double ediffRef = s.energyRef / s.numAtoms - meanEnergyPerAtomRef;
        double ediffNnp = s.energy    / s.numAtoms - meanEnergyPerAtomNnp;
        sigmaEnergyPerAtomRef += ediffRef * ediffRef;
        sigmaEnergyPerAtomNnp += ediffNnp * ediffNnp;
        for (auto const& a : s.atoms)
        {
            double fdiffRef = a.fRef[0] - meanForceRef;
            double fdiffNnp = a.f   [0] - meanForceNnp;
            sigmaForceRef += fdiffRef * fdiffRef;
            sigmaForceNnp += fdiffNnp * fdiffNnp;
            fdiffRef = a.fRef[1] - meanForceRef;
            fdiffNnp = a.f   [1] - meanForceNnp;
            sigmaForceRef += fdiffRef * fdiffRef;
            sigmaForceNnp += fdiffNnp * fdiffNnp;
            fdiffRef = a.fRef[2] - meanForceRef;
            fdiffNnp = a.f   [2] - meanForceNnp;
            sigmaForceRef += fdiffRef * fdiffRef;
            sigmaForceNnp += fdiffNnp * fdiffNnp;
        }
    }
    MPI_Allreduce(MPI_IN_PLACE, &sigmaEnergyPerAtomRef, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
    MPI_Allreduce(MPI_IN_PLACE, &sigmaEnergyPerAtomNnp, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
    MPI_Allreduce(MPI_IN_PLACE, &sigmaForceRef        , 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
    MPI_Allreduce(MPI_IN_PLACE, &sigmaForceNnp        , 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
    sigmaEnergyPerAtomRef = sqrt(sigmaEnergyPerAtomRef / (numStructures - 1));
    sigmaEnergyPerAtomNnp = sqrt(sigmaEnergyPerAtomNnp / (numStructures - 1));
    sigmaForceRef = sqrt(sigmaForceRef / (3 * numAtomsTotal - 1));
    sigmaForceNnp = sqrt(sigmaForceNnp / (3 * numAtomsTotal - 1));
    log << "\n";
    log << strpr("Total number of structures : %zu\n", numStructures);
    log << strpr("Total number of atoms      : %zu\n", numAtomsTotal);
    log << "----------------------------------\n";
    log << "Reference data statistics:\n";
    log << "----------------------------------\n";
    log << strpr("Mean/sigma energy per atom : %16.8E / %16.8E\n",
                 meanEnergyPerAtomRef,
                 sigmaEnergyPerAtomRef);
    log << strpr("Mean/sigma force           : %16.8E / %16.8E\n",
                 meanForceRef,
                 sigmaForceRef);
    log << "----------------------------------\n";
    log << "Initial NNP prediction statistics:\n";
    log << "----------------------------------\n";
    log << strpr("Mean/sigma energy per atom : %16.8E / %16.8E\n",
                 meanEnergyPerAtomNnp,
                 sigmaEnergyPerAtomNnp);
    log << strpr("Mean/sigma force           : %16.8E / %16.8E\n",
                 meanForceNnp,
                 sigmaForceNnp);
    log << "----------------------------------\n";
    // Now set conversion quantities of Mode class.
    if (settings["normalize_data_set"] == "stats-only")
    {
        log << "Data set statistics computation completed, now making up\n";
        log << "for the initially skipped normalization setup...\n";
        log << "\n";
        setupNormalization(false);
    }
    else if (settings["normalize_data_set"] == "ref")
    {
        log << "Normalization based on standard deviation of reference data "
               "selected:\n";
        log << "\n";
        log << "    mean(e_ref) = 0, sigma(e_ref) = sigma(F_ref) = 1\n";
        log << "\n";
        meanEnergy = meanEnergyPerAtomRef;
        convEnergy = 1.0 / sigmaEnergyPerAtomRef;
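        // Forces transform with convEnergy / convLength, so picking
        // convLength = sigma(F_ref) / sigma(e_ref) also rescales the
        // reference forces to unit standard deviation.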
        if (useForcesLocal) convLength = sigmaForceRef / sigmaEnergyPerAtomRef;
        else convLength = 1.0;
        normalize = true;
    }
    else if (settings["normalize_data_set"] == "force")
    {
        if (!useForcesLocal)
        {
            throw runtime_error("ERROR: Selected normalization mode only "
                                "possible when forces are available.\n");
        }
        log << "Normalization based on standard deviation of reference forces "
               "and their\n";
        log << "initial prediction selected:\n";
        log << "\n";
        log << "    mean(e_ref) = 0, sigma(F_NNP) = sigma(F_ref) = 1\n";
        log << "\n";
        meanEnergy = meanEnergyPerAtomRef;
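        // convEnergy / convLength = 1 / sigma(F_ref) rescales the reference
        // forces to unit spread; convLength = sigma(F_NNP) is the choice
        // intended to match the initial prediction spread (see log above).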
        convEnergy = sigmaForceNnp / sigmaForceRef;
        convLength = sigmaForceNnp;
        normalize = true;
    }
    else
    {
        throw runtime_error("ERROR: Unknown data set normalization mode.\n");
    }

    if (settings["normalize_data_set"] != "stats-only")
    {
        log << "Final conversion data:\n";
        log << strpr("Mean ref. energy per atom = %24.16E\n", meanEnergy);
        log << strpr("Conversion factor energy  = %24.16E\n", convEnergy);
        log << strpr("Conversion factor length  = %24.16E\n", convLength);
        log << "----------------------------------\n";
    }

    if ((myRank == 0) &&
        (settings["normalize_data_set"] != "stats-only"))
    {
        log << "\n";
        log << "Writing backup of original settings file to "
               "\"input.nn.bak\".\n";
        ofstream fileSettings;
        fileSettings.open("input.nn.bak");
        writeSettingsFile(&fileSettings);
        fileSettings.close();

        log << "\n";
        log << "Writing normalization data to settings file \"input.nn\".\n";
        string n1 = strpr("mean_energy %24.16E # nnp-train\n",
                          meanEnergyPerAtomRef);
        string n2 = strpr("conv_energy %24.16E # nnp-train\n",
                          convEnergy);
        string n3 = strpr("conv_length %24.16E # nnp-train\n",
                          convLength);
        // Check for existing normalization header and record line numbers
        // to replace.
        auto lines = settings.getSettingsLines();
        map<size_t, string> replace;
        for (size_t i = 0; i < lines.size(); ++i)
        {
            vector<string> sl = split(lines.at(i));
            if (sl.size() > 0)
            {
                if (sl.at(0) == "mean_energy") replace[i] = n1;
                if (sl.at(0) == "conv_energy") replace[i] = n2;
                if (sl.at(0) == "conv_length") replace[i] = n3;
            }
        }
        if (!replace.empty())
        {
            log << "WARNING: Preexisting normalization data was found and "
                   "replaced in original \"input.nn\" file.\n";
        }

        fileSettings.open("input.nn");
        if (replace.empty())
        {
            fileSettings << "#########################################"
                            "######################################\n";
            fileSettings << "# DATA SET NORMALIZATION\n";
            fileSettings << "#########################################"
                            "######################################\n";
            fileSettings << n1;
            fileSettings << n2;
            fileSettings << n3;
            fileSettings << "#########################################"
                            "######################################\n";
            fileSettings << "\n";
        }
        settings.writeSettingsFile(&fileSettings, replace);
        fileSettings.close();
    }

    // Now make up for left-out normalization setup, need to repeat entire
    // symmetry function setup.
    log << "\n";
    if (normalize)
    {
        log << "Silently repeating symmetry function setup...\n";
        log.silent = true;
        for (auto& e : elements) e.clearSymmetryFunctions();
        setupSymmetryFunctions();
#ifndef N2P2_FULL_SFD_MEMORY
        setupSymmetryFunctionMemory(false);
#endif
#ifndef N2P2_NO_SF_CACHE
        setupSymmetryFunctionCache();
#endif
#ifndef N2P2_NO_SF_GROUPS
        setupSymmetryFunctionGroups();
#endif
        setupSymmetryFunctionScaling();
        setupSymmetryFunctionStatistics(false, false, false, false);
        log.silent = false;
    }

    log << "*****************************************"
           "**************************************\n";

    return;
}

void Training::setupTraining()
{
    log << "\n";
    log << "*** SETUP: TRAINING *********************"
           "**************************************\n";
    log << "\n";

    if (nnpType == NNPType::SHORT_CHARGE_NN)
    {
        log << strpr("Running stage %zu of training: ", stage);
        if (stage == 1) log << "charge NN fitting.\n";
        else if (stage == 2) log << "short-range NN fitting.\n";
        else throw runtime_error("\nERROR: Unknown training stage.\n");
    }

    if (nnpType == NNPType::SHORT_ONLY ||
        (nnpType == NNPType::SHORT_CHARGE_NN && stage == 2))
    {
        nnId = "short";
        useForces = settings.keywordExists("use_short_forces");
        if (useForces)
        {
            log << "Forces will be used for training.\n";
            if (settings.keywordExists("force_weight"))
            {
                forceWeight = atof(settings["force_weight"].c_str());
            }
            else
            {
                log << "WARNING: Force weight not set, using default value.\n";
                forceWeight = 1.0;
            }
            log << strpr("Force update weight: %10.2E\n", forceWeight);
        }
        else
        {
            log << "Only energies will be used for training.\n";
        }
    }
    else if (nnpType == NNPType::SHORT_CHARGE_NN && stage == 1)
    {
        nnId = "charge";
    }
    log << "Training will act on \"" << nnId << "\" neural networks.\n";

    if (settings.keywordExists("main_error_metric"))
    {
        string k;
        if (settings["main_error_metric"] == "RMSEpa")
        {
            k = "energy"; if (p.exists(k)) p[k].displayMetric = "RMSEpa";
            k = "force";  if (p.exists(k)) p[k].displayMetric = "RMSE";
            k = "charge"; if (p.exists(k)) p[k].displayMetric = "RMSE";
        }
        else if (settings["main_error_metric"] == "RMSE")
        {
            k = "energy"; if (p.exists(k)) p[k].displayMetric = "RMSE";
            k = "force";  if (p.exists(k)) p[k].displayMetric = "RMSE";
            k = "charge"; if (p.exists(k)) p[k].displayMetric = "RMSE";
        }
        else if (settings["main_error_metric"] == "MAEpa")
        {
            k = "energy"; if (p.exists(k)) p[k].displayMetric = "MAEpa";
            k = "force";  if (p.exists(k)) p[k].displayMetric = "MAE";
            k = "charge"; if (p.exists(k)) p[k].displayMetric = "MAE";
        }
        else if (settings["main_error_metric"] == "MAE")
        {
            k = "energy"; if (p.exists(k)) p[k].displayMetric = "MAE";
            k = "force";  if (p.exists(k)) p[k].displayMetric = "MAE";
            k = "charge"; if (p.exists(k)) p[k].displayMetric = "MAE";
        }
        else
        {
            throw runtime_error("ERROR: Unknown error metric.\n");
        }
    }
    else
    {
        string k;
        k = "energy"; if (p.exists(k)) p[k].displayMetric = "RMSEpa";
        k = "force";  if (p.exists(k)) p[k].displayMetric = "RMSE";
        k = "charge"; if (p.exists(k)) p[k].displayMetric = "RMSE";
    }

    updaterType = (UpdaterType)atoi(settings["updater_type"].c_str());
    if (updaterType == UT_GD)
    {
        log << strpr("Weight update via gradient descent selected: "
                     "updaterType::UT_GD (%d)\n",
                     updaterType);
    }
    else if (updaterType == UT_KF)
    {
        log << strpr("Weight update via Kalman filter selected: "
                     "updaterType::UT_KF (%d)\n",
                     updaterType);
    }
    else if (updaterType == UT_LM)
    {
        throw runtime_error("ERROR: LM algorithm not yet implemented.\n");
        log << strpr("Weight update via Levenberg-Marquardt algorithm "
                     "selected: updaterType::UT_LM (%d)\n",
                     updaterType);
    }
    else
    {
        throw runtime_error("ERROR: Unknown updater type.\n");
    }

    parallelMode = (ParallelMode)atoi(settings["parallel_mode"].c_str());
    //if (parallelMode == PM_DATASET)
    //{
    //    log << strpr("Serial training selected: "
    //                 "ParallelMode::PM_DATASET (%d)\n",
    //                 parallelMode);
    //}
    if (parallelMode == PM_TRAIN_RK0)
    {
        log << strpr("Parallel training (rank 0 updates) selected: "
                     "ParallelMode::PM_TRAIN_RK0 (%d)\n",
                     parallelMode);
    }
    else if (parallelMode == PM_TRAIN_ALL)
    {
        log << strpr("Parallel training (all ranks update) selected: "
                     "ParallelMode::PM_TRAIN_ALL (%d)\n",
                     parallelMode);
    }
    else
    {
        throw runtime_error("ERROR: Unknown parallelization mode.\n");
    }

    jacobianMode = (JacobianMode)atoi(settings["jacobian_mode"].c_str());
    if (jacobianMode == JM_SUM)
    {
        log << strpr("Gradient summation only selected: "
                     "JacobianMode::JM_SUM (%d)\n", jacobianMode);
        log << "No Jacobian matrix is stored; gradients of all training "
               "candidates are summed up instead.\n";
    }
    else if (jacobianMode == JM_TASK)
    {
        log << strpr("Per-task Jacobian selected: "
                     "JacobianMode::JM_TASK (%d)\n",
                     jacobianMode);
        log << "One Jacobian matrix row per MPI task is stored; within each "
               "task gradients are summed up.\n";
    }
    else if (jacobianMode == JM_FULL)
    {
        log << strpr("Full Jacobian selected: "
                     "JacobianMode::JM_FULL (%d)\n",
                     jacobianMode);
        log << "Each update candidate generates one Jacobian matrix "
               "row entry.\n";
    }
    else
    {
        throw runtime_error("ERROR: Unknown Jacobian mode.\n");
    }

    if (updaterType == UT_GD && jacobianMode != JM_SUM)
    {
        throw runtime_error("ERROR: Gradient descent methods can only be "
                            "combined with Jacobian mode JM_SUM.\n");
    }

    updateStrategy = (UpdateStrategy)atoi(settings["update_strategy"].c_str());
    // This section is pushed into a separate function because it is also
    // needed for testing purposes.
    initializeWeightsMemory(updateStrategy);
    // Now it is possible to fill the weights arrays with weight parameters
    // from the neural network.
    getWeights();

    // Set up update candidate selection modes.
    setupSelectionMode("all");
    for (auto k : pk) setupSelectionMode(k);

    log << "-----------------------------------------"
           "--------------------------------------\n";
    repeatedEnergyUpdates = settings.keywordExists("repeated_energy_update");
    if (repeatedEnergyUpdates)
    {
        throw runtime_error("ERROR: Repeated energy updates are not correctly"
                            " implemented at the moment.\n");
        //log << "After each force update an energy update for the\n";
        //log << "corresponding structure will be performed.\n";
    }

    freeMemory = !(settings.keywordExists("memorize_symfunc_results"));
    if (freeMemory)
    {
        log << "Symmetry function memory is cleared after each calculation.\n";
    }
    else
    {
        log << "Symmetry function memory is reused (HIGH MEMORY USAGE!).\n";
    }

    numEpochs = (size_t)atoi(settings["epochs"].c_str());
    log << strpr("Training will be stopped after %zu epochs.\n", numEpochs);

    // Set up how often comparison output files should be written.
    for (auto k : pk) setupFileOutput(k);
    // Set up how often weight files should be written.
    setupFileOutput("weights_epoch");
    // Set up how often neuron statistics files should be written.
    setupFileOutput("neuronstats");

    // Prepare training log header.
    writeTrainingLog = settings.keywordExists("write_trainlog");
    if (writeTrainingLog && myRank == 0)
    {
        if (nnpType == NNPType::SHORT_CHARGE_NN)
        {
            trainingLogFileName += strpr(".stage-%zu", stage);
        }
        log << strpr("Training log with update information will be written to:"
                     " %s.\n", trainingLogFileName.c_str());
        trainingLog.open(trainingLogFileName.c_str());

        // File header.
        vector<string> title;
        vector<string> colName;
        vector<string> colInfo;
        vector<size_t> colSize;
        title.push_back("Detailed information on each weight update.");
        colSize.push_back(3);
        colName.push_back("U");
        colInfo.push_back("Update type (E = energy, F = force, Q = charge).");
        colSize.push_back(5);
        colName.push_back("epoch");
        colInfo.push_back("Current training epoch.");
        colSize.push_back(10);
        colName.push_back("count");
        colInfo.push_back("Update counter (multiple lines with identical count"
                          " for multi-streaming!).");
        colSize.push_back(5);
        colName.push_back("proc");
        colInfo.push_back("MPI process providing this update candidate.");
        colSize.push_back(3);
        colName.push_back("tl");
        colInfo.push_back("Threshold loop counter.");
        colSize.push_back(10);
        colName.push_back("rmse_frac");
        colInfo.push_back("Update candidate's error divided by this "
                          "epoch's RMSE.");
        colSize.push_back(10);
        colName.push_back("s_ind_g");
        colInfo.push_back("Global structure index.");
        colSize.push_back(5);
        colName.push_back("s_ind");
        colInfo.push_back("Local structure index on this MPI process.");
        colSize.push_back(5);
        colName.push_back("a_ind");
        colInfo.push_back("Atom index.");
        colSize.push_back(2);
        colName.push_back("c");
        colInfo.push_back("Force component (0 = x, 1 = y, 2 = z).");
        appendLinesToFile(trainingLog,
                          createFileHeader(title, colSize, colName, colInfo));
    }

    // Compute number of updates and properties per update.
    log << "-----------------------------------------"
           "--------------------------------------\n";
    for (auto k : pk) setupUpdatePlan(k);
    if (p.exists("energy") && p.exists("force"))
    {
        Property& pe = p["energy"];
        Property& pf = p["force"];
        log << strpr("Energy to force ratio                     : "
                     "  1 : %5.1f\n",
                     static_cast<double>(
                         pf.numUpdates * pf.patternsPerUpdateGlobal)
                     / (pe.numUpdates * pe.patternsPerUpdateGlobal));
        log << strpr("Energy to force percentages               : "
                     "%5.1f%% : %5.1f%%\n",
                     pe.numUpdates * pe.patternsPerUpdateGlobal * 100.0 /
                     (pe.numUpdates * pe.patternsPerUpdateGlobal
                      + pf.numUpdates * pf.patternsPerUpdateGlobal),
                     pf.numUpdates * pf.patternsPerUpdateGlobal * 100.0 /
                     (pe.numUpdates * pe.patternsPerUpdateGlobal
                      + pf.numUpdates * pf.patternsPerUpdateGlobal));
    }
    double totalUpdates = 0.0;
    for (auto k : pk) totalUpdates += p[k].numUpdates;
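    // Kept as a double: only used below to scale the Kalman decay parameters
    // qtau/etatau by the projected number of updates per epoch.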
    log << "-----------------------------------------"
           "--------------------------------------\n";

    // Allocate error and Jacobian arrays.
    for (auto k : pk) allocateArrays(k);
    log << "-----------------------------------------"
           "--------------------------------------\n";

    // Set up new C++11 random number generator (TODO: move it!).
    rngGlobalNew.seed(gsl_rng_get(rngGlobal));
    rngNew.seed(gsl_rng_get(rng));
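    // Seeding the C++11 engines from the already seeded GSL generators keeps
    // every random stream reproducible from the single input seed.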

    // Updater setup.
    GradientDescent::DescentType descentType = GradientDescent::DT_FIXED;
    if (updaterType == UT_GD)
    {
        descentType = (GradientDescent::DescentType)
                      atoi(settings["gradient_type"].c_str());
    }
    KalmanFilter::KalmanType kalmanType = KalmanFilter::KT_STANDARD;
    if (updaterType == UT_KF)
    {
        kalmanType = (KalmanFilter::KalmanType)
                     atoi(settings["kalman_type"].c_str());
    }

    for (size_t i = 0; i < numUpdaters; ++i)
    {
        if ( (myRank == 0) || (parallelMode == PM_TRAIN_ALL) )
        {
            if (updaterType == UT_GD)
            {
                updaters.push_back(
                    (Updater*)new GradientDescent(numWeightsPerUpdater.at(i),
                                                  descentType));
            }
            else if (updaterType == UT_KF)
            {
                updaters.push_back(
                    (Updater*)new KalmanFilter(numWeightsPerUpdater.at(i),
                                               kalmanType));
            }
            updaters.back()->setState(&(weights.at(i).front()));
            updaters.back()->setupTiming(strpr("wupd%zu", i));
            updaters.back()->resetTimingLoop();
        }
    }
    if (updaters.size() > 0) hasUpdaters = true;
    else hasUpdaters = false;

    if (hasUpdaters && updaterType == UT_GD)
    {
        if (descentType == GradientDescent::DT_FIXED)
        {
            double const eta = atof(settings["gradient_eta"].c_str());
            for (size_t i = 0; i < numUpdaters; ++i)
            {
                GradientDescent* u =
                    dynamic_cast<GradientDescent*>(updaters.at(i));
                u->setParametersFixed(eta);
            }
        }
        if (descentType == GradientDescent::DT_ADAM)
        {
            double const eta   = atof(settings["gradient_adam_eta"].c_str());
            double const beta1 = atof(settings["gradient_adam_beta1"].c_str());
            double const beta2 = atof(settings["gradient_adam_beta2"].c_str());
            double const eps   = atof(settings["gradient_adam_epsilon"].c_str());
            for (size_t i = 0; i < numUpdaters; ++i)
            {
                GradientDescent* u =
                    dynamic_cast<GradientDescent*>(updaters.at(i));
                u->setParametersAdam(eta, beta1, beta2, eps);
            }
        }
    }
    else if (hasUpdaters && updaterType == UT_KF)
    {
        if (kalmanType == KalmanFilter::KT_STANDARD)
        {
            double const epsilon = atof(settings["kalman_epsilon"].c_str());
            double const q0      = atof(settings["kalman_q0"     ].c_str());
            double const qtau    = atof(settings["kalman_qtau"   ].c_str())
                                   / totalUpdates;
            log << "qtau is divided by number "
                   "of projected updates per epoch.\n";
            double const qmin    = atof(settings["kalman_qmin"   ].c_str());
            double const eta0    = atof(settings["kalman_eta"    ].c_str());
            double etatau = 1.0;
            double etamax = eta0;
            if (settings.keywordExists("kalman_etatau") &&
                settings.keywordExists("kalman_etamax"))
            {
                etatau = atof(settings["kalman_etatau"].c_str())
                         / totalUpdates;
                log << "etatau is divided by number "
                       "of projected updates per epoch.\n";
                etamax = atof(settings["kalman_etamax"].c_str());
            }
            for (size_t i = 0; i < updaters.size(); ++i)
            {
                KalmanFilter* u = dynamic_cast<KalmanFilter*>(updaters.at(i));
                u->setParametersStandard(epsilon,
                                         q0,
                                         qtau,
                                         qmin,
                                         eta0,
                                         etatau,
                                         etamax);
            }
        }
        else if (kalmanType == KalmanFilter::KT_FADINGMEMORY)
        {
            double const epsilon = atof(settings["kalman_epsilon"].c_str());
            double const q0      = atof(settings["kalman_q0"     ].c_str());
            double const qtau    = atof(settings["kalman_qtau"   ].c_str())
                                   / totalUpdates;
            log << "qtau is divided by number "
                   "of projected updates per epoch.\n";
            double const qmin   = atof(settings["kalman_qmin"].c_str());
            double const lambda =
                           atof(settings["kalman_lambda_short"].c_str());
            //double const nu =
            //    pow(atof(settings["kalman_nue_short"].c_str()), numProcs);
            //log << "nu is exponentiated with the number of streams.\n";
            double const nu = atof(settings["kalman_nue_short"].c_str());
            for (size_t i = 0; i < updaters.size(); ++i)
            {
                KalmanFilter* u = dynamic_cast<KalmanFilter*>(updaters.at(i));
                u->setParametersFadingMemory(epsilon,
                                             q0,
                                             qtau,
                                             qmin,
                                             lambda,
                                             nu);
            }
        }
    }

    log << "-----------------------------------------"
           "--------------------------------------\n";
    for (size_t i = 0; i < updaters.size(); ++i)
    {
        if (updateStrategy == US_COMBINED)
        {
            log << strpr("Combined weight updater:\n");
        }
        else if (updateStrategy == US_ELEMENT)
        {
            log << strpr("Weight updater for element %2s :\n",
                         elements.at(i).getSymbol().c_str());
        }
        log << "-----------------------------------------"
               "--------------------------------------\n";
        log << updaters.at(i)->info();
        if (updaterType == UT_KF)
        {
            log << "Note: During training loop the actual observation\n";
            log << "      size corresponds to error vector size:\n";
            for (auto k : pk)
            {
                log << strpr("sizeObservation = %zu (%s updates)\n",
                             p[k].error.at(i).size(), k.c_str());
            }
        }
        log << "-----------------------------------------"
               "--------------------------------------\n";
    }

    log << strpr("TIMING Finished setup: %.2f seconds.\n",
                 sw["setup"].stop());
    log << "*****************************************"
           "**************************************\n";

    return;
}

vector<string> Training::setupNumericDerivCheck()
{
    log << "\n";
    log << "*** SETUP WEIGHT DERIVATIVES CHECK ******"
           "**************************************\n";
    log << "\n";

    log << "Weight derivatives will be checked for these properties:\n";
    for (auto k : pk) log << " - " + p[k].plural + "\n";
    log << "\n";

    if (nnpType == NNPType::SHORT_ONLY)
    {
        nnId = "short";
        readNeuralNetworkWeights(nnId, "weights.%03zu.data");
    }
    else if (nnpType == NNPType::SHORT_CHARGE_NN && stage == 1)
    {
        nnId = "charge";
        readNeuralNetworkWeights(nnId, "weightse.%03zu.data");
    }
    else if (nnpType == NNPType::SHORT_CHARGE_NN && stage == 2)
    {
        nnId = "short";
        readNeuralNetworkWeights("charge", "weightse.%03zu.data");
        readNeuralNetworkWeights(nnId, "weights.%03zu.data");
    }
    getWeights();

    log << "*****************************************"
           "**************************************\n";

    return pk;
}

void Training::calculateNeighborLists()
{
    sw["nl"].start();
    log << "\n";
    log << "*** CALCULATE NEIGHBOR LISTS ************"
           "**************************************\n";
    log << "\n";

#ifdef _OPENMP
    int num_threads = omp_get_max_threads();
    omp_set_num_threads(1);
    log << strpr("Temporarily disabling OpenMP parallelization: %d threads.\n",
                 omp_get_max_threads());
#endif
    log << "Calculating neighbor lists for all structures.\n";
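    // Internal lengths carry a factor of convLength when normalization is
    // active, so the cutoff is reported in physical units for comparison
    // with the input data.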
    double maxCutoffRadiusPhys = maxCutoffRadius;
    if (normalize) maxCutoffRadiusPhys = maxCutoffRadius / convLength;
    log << strpr("Cutoff radius for neighbor lists: %f\n",
                 maxCutoffRadiusPhys);
    for (vector<Structure>::iterator it = structures.begin();
         it != structures.end(); ++it)
    {
        it->calculateNeighborList(maxCutoffRadius);
    }
#ifdef _OPENMP
    omp_set_num_threads(num_threads);
    log << strpr("Restoring OpenMP parallelization: max. %d threads.\n",
                 omp_get_max_threads());
#endif

    log << "-----------------------------------------"
           "--------------------------------------\n";
    log << strpr("TIMING Finished neighbor lists: %.2f seconds.\n",
                 sw["nl"].stop());
    log << "*****************************************"
           "**************************************\n";

    return;
}

void Training::calculateError(
    map<string, pair<string, string>> const fileNames)
{
#ifdef _OPENMP
    int num_threads = omp_get_max_threads();
    omp_set_num_threads(1);
#endif
    vector<string> write;
    for (auto i : fileNames)
    {
        if (i.second.first.size() == 0 || i.second.second.size() == 0)
        {
            throw runtime_error("ERROR: No filename provided for comparison "
                                "files.\n");
        }
        write.push_back(i.first);
    }
    auto doWrite = [&write](string key){
                       return find(write.begin(),
                                   write.end(),
                                   key) != write.end();
                   };

    map<string, size_t> countTrain;
    map<string, size_t> countTest;
    for (auto k : pk) countTrain[k] = 0;
    for (auto k : pk) countTest[k]  = 0;
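    // One pattern counter, error-metric map and (optional) comparison file
    // per property, kept separately for the training and test sets.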

    map<string, ofstream> filesTrain;
    map<string, ofstream> filesTest;

    // Reset current error metrics.
    for (auto k : pk)
    {
        for (auto& m : p[k].errorTrain) m.second = 0.0;
        for (auto& m : p[k].errorTest)  m.second = 0.0;
    }

    for (auto k : write)
    {
        filesTrain[k].open(strpr("%s.%04d",
                                 fileNames.at(k).first.c_str(),
                                 myRank).c_str());
        filesTest[k].open(strpr("%s.%04d",
                                fileNames.at(k).second.c_str(),
                                myRank).c_str());
        // File header.
        vector<string> header;
        if (myRank == 0)
        {
            vector<string> title;
            vector<string> colName;
            vector<string> colInfo;
            vector<size_t> colSize;
            if (k == "energy")
            {
                title.push_back("Energy comparison.");
                colSize.push_back(10);
                colName.push_back("index");
                colInfo.push_back("Structure index.");
                colSize.push_back(16);
                colName.push_back("Eref");
                colInfo.push_back("Reference potential energy per atom "
                                  "(training units).");
                colSize.push_back(16);
                colName.push_back("Ennp");
                colInfo.push_back("NNP potential energy per atom "
                                  "(training units).");
            }
            else if (k == "force")
            {
                title.push_back("Force comparison.");
                colSize.push_back(10);
                colName.push_back("index_s");
                colInfo.push_back("Structure index.");
                colSize.push_back(10);
                colName.push_back("index_a");
                colInfo.push_back("Atom index (x, y, z components in "
                                  "consecutive lines).");
                colSize.push_back(16);
                colName.push_back("Fref");
                colInfo.push_back("Reference force (training units).");
                colSize.push_back(16);
                colName.push_back("Fnnp");
                colInfo.push_back("NNP force (training units).");
            }
            else if (k == "charge")
            {
                title.push_back("Charge comparison.");
                colSize.push_back(10);
                colName.push_back("index_s");
                colInfo.push_back("Structure index.");
                colSize.push_back(10);
                colName.push_back("index_a");
                colInfo.push_back("Atom index.");
                colSize.push_back(16);
                colName.push_back("Qref");
                colInfo.push_back("Reference charge.");
                colSize.push_back(16);
                colName.push_back("Qnnp");
                colInfo.push_back("NNP charge.");
            }
            header = createFileHeader(title, colSize, colName, colInfo);
            appendLinesToFile(filesTrain.at(k), header);
            appendLinesToFile(filesTest.at(k), header);
        }
    }

    for (vector<Structure>::iterator it = structures.begin();
         it != structures.end(); ++it)
    {
#ifdef N2P2_NO_SF_GROUPS
        calculateSymmetryFunctions((*it), useForces);
#else
        calculateSymmetryFunctionGroups((*it), useForces);
#endif
        calculateAtomicNeuralNetworks((*it), useForces);
        calculateEnergy((*it));
        if (useForces) calculateForces((*it));
        for (auto k : pk)
        {
            map<string, double>* error = nullptr;
            size_t*              count = nullptr;
            ofstream*            file  = nullptr;
            if (it->sampleType == Structure::ST_TRAINING)
            {
                error = &(p[k].errorTrain);
                count = &(countTrain.at(k));
                if (doWrite(k)) file = &(filesTrain.at(k));
            }
            else if (it->sampleType == Structure::ST_TEST)
            {
                error = &(p[k].errorTest);
                count = &(countTest.at(k));
                if (doWrite(k)) file = &(filesTest.at(k));
            }

            it->updateError(k, *error, *count);
            if (doWrite(k))
            {
                if (k == "energy") (*file) << it->getEnergyLine();
                else if (k == "force")
                {
                    for (auto l : it->getForcesLines()) (*file) << l;
                }
                else if (k == "charge")
                {
                    for (auto l : it->getChargesLines()) (*file) << l;
                }
            }
        }
        if (freeMemory) it->freeAtoms(true);
    }

    for (auto k : pk)
    {
        collectError(k, p[k].errorTrain, countTrain.at(k));
        collectError(k, p[k].errorTest, countTest.at(k));
        if (doWrite(k))
        {
            filesTrain.at(k).close();
            filesTest.at(k).close();
            MPI_Barrier(comm);
            if (myRank == 0)
            {
                combineFiles(fileNames.at(k).first);
                combineFiles(fileNames.at(k).second);
            }
        }
    }

#ifdef _OPENMP
    omp_set_num_threads(num_threads);
#endif

    return;
}

void Training::calculateErrorEpoch()
{
    // Check whether property comparison files should be written for
    // this epoch.
    map<string, pair<string, string>> fileNames;

    for (auto const& ip : p)
    {
        string const&   k = ip.first;  // key
        Property const& d = ip.second; // data
        if (d.writeCompEvery > 0 &&
            (epoch % d.writeCompEvery == 0 || epoch <= d.writeCompAlways))
        {
            string middle;
            if      (k == "energy") middle = "points";
            else if (k == "force" ) middle = "forces";
            else if (k == "charge") middle = "charges";
            fileNames[k] = make_pair(strpr("train%s.%06zu.out",
                                           middle.c_str(), epoch),
                                     strpr("test%s.%06zu.out",
                                           middle.c_str(), epoch));
        }
    }

    // Calculate errors and write comparison files.
    calculateError(fileNames);

    return;
}

void Training::printHeader()
{
    string metric = "?";
    string peratom = "";

    log << "The training loop output covers different errors, update and\n";
    log << "timing information. The following quantities are organized\n";
    log << "according to the matrix scheme below:\n";
    log << "-------------------------------------------------------------------\n";
    log << "ep ........ Epoch.\n";
    for (auto k : pk)
    {
        string const& pmetric = p[k].displayMetric;
        if (pmetric.find("RMSE") != pmetric.npos) metric = "RMSE";
        else if (pmetric.find("MAE") != pmetric.npos) metric = "MAE";
        if (pmetric.find("pa") != pmetric.npos) peratom = " per atom";
        else peratom = "";
        log << p[k].tiny << "_count ... Number of " << k << " updates.\n";
        log << p[k].tiny << "_train ... " << metric << " of training "
            << p[k].plural << peratom << ".\n";
        log << p[k].tiny << "_test .... " << metric << " of test "
            << p[k].plural << peratom << ".\n";
        //log << p[k].tiny << "_time ........ Time for " << k << " updates "
        //    << "(seconds).\n";
        log << p[k].tiny << "_pt ...... Percentage of time for " << k <<
               " updates w.r.t. t_train.\n";
    }
    log << "count ..... Total number of updates.\n";
    log << "train ..... Percentage of time for training.\n";
    log << "error ..... Percentage of time for error calculation.\n";
    log << "other ..... Percentage of time for other purposes.\n";
    log << "epoch ..... Total time for this epoch (seconds).\n";
    log << "total ..... Total time for all epochs (seconds).\n";
    log << "-------------------------------------------------------------------\n";
    for (auto k : pk)
    {
        log << strpr("%-6s", k.c_str())
            << strpr(" %5s", "ep")
            << strpr(" %7s", (p[k].tiny + "_count").c_str())
            << strpr(" %11s", (p[k].tiny + "_train").c_str())
            << strpr(" %11s", (p[k].tiny + "_test").c_str())
            << strpr(" %5s", (p[k].tiny + "_pt").c_str())
            << "\n";
    }
    log << strpr("%-6s", "timing")
        << strpr(" %5s", "ep")
        << strpr(" %7s", "count")
        << strpr(" %5s", "train")
        << strpr(" %5s", "error")
        << strpr(" %5s", "other")
        << strpr(" %9s", "epoch")
        << strpr(" %9s", "total")
        << "\n";
    log << "-------------------------------------------------------------------\n";

    return;
}

void Training::printEpoch()
{
    double timeLoop  = sw["loop"].getLoop();
    double timeTrain = sw["train"].getLoop();
    size_t totalUpdates = 0;
    for (auto k : pk)
    {
        totalUpdates += p[k].countUpdates;
        double timeProp = sw[k].getLoop();
        string caps = k;
        for (auto& c : caps) c = toupper(c);
        log << strpr("%-6s", caps.c_str());
        log << strpr(" %5zu", epoch);
        log << strpr(" %7zu", p[k].countUpdates);
        if (normalize && (k != "charge"))
        {
            log << strpr(" %11.5E %11.5E",
                         physical(k, p[k].errorTrain.at(p[k].displayMetric)),
                         physical(k, p[k].errorTest.at(p[k].displayMetric)));
        }
        else
        {
            log << strpr(" %11.5E %11.5E",
                         p[k].errorTrain.at(p[k].displayMetric),
                         p[k].errorTest.at(p[k].displayMetric));
        }
        if (epoch == 0) log << strpr(" %5.1f", 0.0);
        else log << strpr(" %5.1f", timeProp / timeTrain * 100.0);
        log << "\n";
    }
    double timeOther = timeLoop;
    timeOther -= sw["error"].getLoop();
    timeOther -= sw["train"].getLoop();
    log << strpr("%-6s", "TIMING");
    log << strpr(" %5zu", epoch);
    log << strpr(" %7zu", totalUpdates);
    log << strpr(" %5.1f", sw["train"].getLoop() / timeLoop * 100.0);
    log << strpr(" %5.1f", sw["error"].getLoop() / timeLoop * 100.0);
    log << strpr(" %5.1f", timeOther / timeLoop * 100.0);
    log << strpr(" %9.2f", sw["loop"].getLoop());
    log << strpr(" %9.2f", sw["loop"].getTotal());
    log << "\n";

    return;
}

void Training::writeWeights(string const& nnName,
                            string const& fileNameFormat) const
{
    ofstream file;

    for (size_t i = 0; i < numElements; ++i)
    {
        string fileName = strpr(fileNameFormat.c_str(),
                                elements.at(i).getAtomicNumber());
        file.open(fileName.c_str());
        elements.at(i).neuralNetworks.at(nnName).writeConnections(file);
        file.close();
    }

    return;
}

void Training::writeWeightsEpoch() const
{
    if (writeWeightsEvery > 0 &&
        (epoch % writeWeightsEvery == 0 || epoch <= writeWeightsAlways))
    {
        if (nnpType == NNPType::SHORT_ONLY ||
            (nnpType == NNPType::SHORT_CHARGE_NN && stage == 2))
        {
            writeWeights("short", strpr("weights.%%03zu.%06d.out", epoch));
        }
        else if (nnpType == NNPType::SHORT_CHARGE_NN && stage == 1)
        {
            writeWeights("charge", strpr("weightse.%%03zu.%06d.out", epoch));
        }
    }

    return;
}

void Training::writeLearningCurve(bool append, string const fileName) const
{
    ofstream file;
    string fileNameActual = fileName;
    if (nnpType == NNPType::SHORT_CHARGE_NN)
    {
        fileNameActual += strpr(".stage-%zu", stage);
    }

    if (append) file.open(fileNameActual.c_str(), ofstream::app);
    else
    {
        file.open(fileNameActual.c_str());

        // File header.
        vector<string> title;
        vector<string> colName;
        vector<string> colInfo;
        vector<size_t> colSize;
        if (nnpType == NNPType::SHORT_ONLY ||
            (nnpType == NNPType::SHORT_CHARGE_NN && stage == 2))
        {
            title.push_back("Learning curves for energies and forces.");
        }
        else if (nnpType == NNPType::SHORT_CHARGE_NN && stage == 1)
        {
            title.push_back("Learning curves for charges.");
        }
        colSize.push_back(10);
        colName.push_back("epoch");
        colInfo.push_back("Current epoch.");

        map<string, string> text;
        text["RMSEpa"] = "RMSE of %s %s per atom";
        text["RMSE"]   = "RMSE of %s %s";
        text["MAEpa"]  = "MAE of %s %s per atom";
        text["MAE"]    = "MAE of %s %s";

        for (auto k : pk)
        {
            for (auto m : p[k].errorMetrics)
            {
                colSize.push_back(16);
                colName.push_back(m + "_" + p[k].tiny + "train_pu");
                colInfo.push_back(strpr(
                                      (text[m] + " (physical units)").c_str(),
                                      "training",
                                      p[k].plural.c_str()));
                colSize.push_back(16);
                colName.push_back(m + "_" + p[k].tiny + "test_pu");
                colInfo.push_back(strpr(
                                      (text[m] + " (physical units)").c_str(),
                                      "test",
                                      p[k].plural.c_str()));
            }
        }
        if (normalize)
        {
            for (auto k : pk)
            {
                // Internal units only for energies and forces.
                if (!(k == "energy" || k == "force")) continue;
                for (auto m : p[k].errorMetrics)
                {
                    colSize.push_back(16);
                    colName.push_back(m + "_" + p[k].tiny + "train_iu");
                    colInfo.push_back(strpr(
                                        (text[m] + " (training units)").c_str(),
                                        "training",
                                        p[k].plural.c_str()));
                    colSize.push_back(16);
                    colName.push_back(m + "_" + p[k].tiny + "test_iu");
                    colInfo.push_back(strpr(
                                        (text[m] + " (training units)").c_str(),
                                        "test",
                                        p[k].plural.c_str()));
                }
            }
        }
        appendLinesToFile(file,
                          createFileHeader(title, colSize, colName, colInfo));
    }

    file << strpr("%10zu", epoch);
    if (normalize)
    {
        for (auto k : pk)
        {
            if (!(k == "energy" || k == "force")) continue;
            for (auto m : p[k].errorMetrics)
            {
                file << strpr(" %16.8E %16.8E",
                              physical(k, p[k].errorTrain.at(m)),
                              physical(k, p[k].errorTest.at(m)));
            }
        }
    }
    for (auto k : pk)
    {
        for (auto m : p[k].errorMetrics)
        {
            file << strpr(" %16.8E %16.8E",
                          p[k].errorTrain.at(m),
                          p[k].errorTest.at(m));
        }
    }
    file << "\n";
    file.flush();
    file.close();

    return;
}

void Training::writeNeuronStatistics(string const& nnName,
                                     string const& fileName) const
{
    ofstream file;
    if (myRank == 0)
    {
        file.open(fileName.c_str());

        // File header.
        vector<string> title;
        vector<string> colName;
        vector<string> colInfo;
        vector<size_t> colSize;
        title.push_back("Statistics for individual neurons of network \""
                        + nnName + "\" gathered during RMSE calculation.");
        colSize.push_back(10);
        colName.push_back("element");
        colInfo.push_back("Element index.");
        colSize.push_back(10);
        colName.push_back("neuron");
        colInfo.push_back("Neuron number.");
        colSize.push_back(10);
        colName.push_back("count");
        colInfo.push_back("Number of neuron value computations.");
        colSize.push_back(16);
        colName.push_back("min");
        colInfo.push_back("Minimum neuron value encountered.");
        colSize.push_back(16);
        colName.push_back("max");
        colInfo.push_back("Maximum neuron value encountered.");
        colSize.push_back(16);
        colName.push_back("mean");
        colInfo.push_back("Mean neuron value.");
        colSize.push_back(16);
        colName.push_back("sigma");
        colInfo.push_back("Standard deviation of neuron value.");
        appendLinesToFile(file,
                          createFileHeader(title, colSize, colName, colInfo));
    }

    for (size_t i = 0; i < numElements; ++i)
    {
        size_t n = elements.at(i).neuralNetworks.at(nnName).getNumNeurons();
        vector<long>   count(n, 0);
        vector<double> min  (n, 0.0);
        vector<double> max  (n, 0.0);
        vector<double> mean (n, 0.0);
        vector<double> sigma(n, 0.0);
        elements.at(i).neuralNetworks.at(nnName).
            getNeuronStatistics(&(count.front()),
                                &(min.front()),
                                &(max.front()),
                                &(mean.front()),
                                &(sigma.front()));
        // Collect statistics from all processors on proc 0.
        if (myRank == 0)
        {
            MPI_Reduce(MPI_IN_PLACE, &(count.front()), n, MPI_LONG  , MPI_SUM, 0, comm);
            MPI_Reduce(MPI_IN_PLACE, &(min.front())  , n, MPI_DOUBLE, MPI_MIN, 0, comm);
            MPI_Reduce(MPI_IN_PLACE, &(max.front())  , n, MPI_DOUBLE, MPI_MAX, 0, comm);
            MPI_Reduce(MPI_IN_PLACE, &(mean.front()) , n, MPI_DOUBLE, MPI_SUM, 0, comm);
            MPI_Reduce(MPI_IN_PLACE, &(sigma.front()), n, MPI_DOUBLE, MPI_SUM, 0, comm);
        }
        else
        {
            MPI_Reduce(&(count.front()), &(count.front()), n, MPI_LONG  , MPI_SUM, 0, comm);
            MPI_Reduce(&(min.front())  , &(min.front())  , n, MPI_DOUBLE, MPI_MIN, 0, comm);
            MPI_Reduce(&(max.front())  , &(max.front())  , n, MPI_DOUBLE, MPI_MAX, 0, comm);
            MPI_Reduce(&(mean.front()) , &(mean.front()) , n, MPI_DOUBLE, MPI_SUM, 0, comm);
            MPI_Reduce(&(sigma.front()), &(sigma.front()), n, MPI_DOUBLE, MPI_SUM, 0, comm);
        }
        if (myRank == 0)
        {
            for (size_t j = 0; j < n; ++j)
            {
                size_t m = count.at(j);
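                // After the reductions, mean holds the sum of neuron values
                // and sigma the sum of squared values; combine them into the
                // sample standard deviation
                // sqrt((m * sum(x^2) - sum(x)^2) / (m * (m - 1))).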
                sigma.at(j) = sqrt((m * sigma.at(j) - mean.at(j) * mean.at(j))
                            / (m * (m - 1)));
                mean.at(j) /= m;
                file << strpr("%10zu %10zu %10ld %16.8E %16.8E %16.8E %16.8E\n",
                              i + 1,
                              j + 1,
                              count[j],
                              min[j],
                              max[j],
                              mean[j],
                              sigma[j]);
            }
        }
    }

    if (myRank == 0)
    {
        file.close();
    }

    return;
}

void Training::writeNeuronStatisticsEpoch() const
{
    vector<pair<string, string>> nnInfo; // NN name and file name.

    if (writeNeuronStatisticsEvery > 0 &&
        (epoch % writeNeuronStatisticsEvery == 0 ||
         epoch <= writeNeuronStatisticsAlways))
    {
        if (nnpType == NNPType::SHORT_ONLY)
        {
            nnInfo.push_back(
                make_pair("short", strpr("neuron-stats.%06zu.out", epoch)));
        }
        else if (nnpType == NNPType::SHORT_CHARGE_NN)
        {
            if (stage == 1)
            {
                nnInfo.push_back(
                    make_pair("charge",
                              strpr("neuron-stats.%s.%06zu.out.stage-%zu",
                                    "charge", epoch, stage)));
            }
            else if (stage == 2)
            {
                nnInfo.push_back(
                    make_pair("charge",
                              strpr("neuron-stats.%s.%06zu.out.stage-%zu",
                                    "charge", epoch, stage)));
                nnInfo.push_back(
                    make_pair("short",
                              strpr("neuron-stats.%s.%06zu.out.stage-%zu",
                                    "short", epoch, stage)));
            }
        }
        for (auto const& i : nnInfo) writeNeuronStatistics(i.first, i.second);
    }

    return;
}

void Training::resetNeuronStatistics()
{
    for (vector<Element>::iterator it = elements.begin();
         it != elements.end(); ++it)
    {
        for (auto& nn : it->neuralNetworks) nn.second.resetNeuronStatistics();
    }
    return;
}

void Training::writeUpdaterStatus(bool         append,
                                  string const fileNameFormat) const
{
    ofstream file;
    string fileNameFormatActual = fileNameFormat;
    if (nnpType == NNPType::SHORT_CHARGE_NN)
    {
        fileNameFormatActual += strpr(".stage-%zu", stage);
    }

    for (size_t i = 0; i < numUpdaters; ++i)
    {
        string fileName;
        if (updateStrategy == US_COMBINED)
        {
            fileName = strpr(fileNameFormatActual.c_str(), 0);
        }
        else if (updateStrategy == US_ELEMENT)
        {
            fileName = strpr(fileNameFormatActual.c_str(),
                             elements.at(i).getAtomicNumber());
        }
        if (append) file.open(fileName.c_str(), ofstream::app);
        else
        {
            file.open(fileName.c_str());
            appendLinesToFile(file, updaters.at(i)->statusHeader());
        }
        file << updaters.at(i)->status(epoch);
        file.close();
    }

    return;
}

void Training::sortUpdateCandidates(string const& property)
{
    // Update error for all structures.
    for (auto& uc : p[property].updateCandidates)
    {
        if (property == "energy")
        {
            Structure const& s = structures.at(uc.s);
            uc.error = fabs((s.energyRef - s.energy) / s.numAtoms);
        }
        else if (property == "force")
        {
            Atom const& a = structures.at(uc.s).atoms.at(uc.a);
            uc.error = fabs(a.fRef[uc.c] - a.f[uc.c]);
        }
        else if (property == "charge")
        {
            Atom const& a = structures.at(uc.s).atoms.at(uc.a);
            uc.error = fabs(a.chargeRef - a.charge);
        }
    }
1913 // Sort update candidates list.
1914 sort(p[property].updateCandidates.begin(),
1915 p[property].updateCandidates.end());
1916 // Reset current position.
1917 p[property].posUpdateCandidates = 0;
1918
1919 return;
1920}
1921
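Aside (illustrative sketch, not part of Training.cpp): sortUpdateCandidates relies on UpdateCandidate's comparison operator; under SM_SORT the intent is that the patterns with the largest current error are drawn first. The same selection order with an explicit comparator (struct and values hypothetical):

#include <algorithm>
#include <cstddef>
#include <vector>

struct Candidate { std::size_t s; double error; };

int main()
{
    std::vector<Candidate> cand = {{0, 0.1}, {1, 0.7}, {2, 0.3}};
    std::sort(cand.begin(), cand.end(),
              [](Candidate const& a, Candidate const& b)
              { return a.error > b.error; }); // descending error
    // cand order is now 1, 2, 0; training starts with the worst pattern.
    return 0;
}
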
1922void Training::shuffleUpdateCandidates(string const& property)
1923{
1924 shuffle(p[property].updateCandidates.begin(),
1925 p[property].updateCandidates.end(),
1926 rngNew);
1927 // Reset current position.
1928 p[property].posUpdateCandidates = 0;
1929
1930 return;
1931}
1932
1933void Training::setEpochSchedule()
1934{
1935 // Clear epoch schedule.
1936 epochSchedule.clear();
1937 vector<int>(epochSchedule).swap(epochSchedule);
1938
1939 // Grow schedule vector by each property's number of desired updates.
1940 // Fill this array looping in reverse direction for backward compatibility.
1941 //for (size_t i = 0; i < pk.size(); ++i)
1942 for (int i = pk.size() - 1; i >= 0; --i)
1943 {
1944 epochSchedule.insert(epochSchedule.end(), p[pk.at(i)].numUpdates, i);
1945 }
1946
1947 // Return if there is only a single training property.
1948 if (pk.size() == 1) return;
1949
1950 // Now shuffle the schedule to get a random sequence.
1951 shuffle(epochSchedule.begin(), epochSchedule.end(), rngGlobalNew);
1952
1953 //for (size_t i = 0; i < epochSchedule.size(); ++i)
1954 //{
1955 // log << strpr("%zu %zu\n", i, epochSchedule.at(i));
1956 //}
1957
1958 return;
1959}
1960
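Aside (illustrative sketch, not part of Training.cpp): the epoch schedule is simply a shuffled multiset of property indices, one entry per planned update, so that e.g. energy and force updates interleave randomly over the epoch. A sketch with a fixed seed standing in for rngGlobalNew:

#include <algorithm>
#include <random>
#include <vector>

int main()
{
    std::vector<std::size_t> numUpdates = {3, 9}; // e.g. energy, force
    std::vector<int> schedule;
    for (int i = static_cast<int>(numUpdates.size()) - 1; i >= 0; --i)
    {
        schedule.insert(schedule.end(), numUpdates.at(i), i);
    }
    std::mt19937_64 rng(1234);
    std::shuffle(schedule.begin(), schedule.end(), rng);
    // schedule now holds 3 zeros randomly mixed among 9 ones.
    return 0;
}
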
1961void Training::checkSelectionMode()
1962{
1963 for (auto k : pk)
1964 {
1965 if (p[k].selectionModeSchedule.find(epoch)
1966 != p[k].selectionModeSchedule.end())
1967 {
1968 p[k].selectionMode = p[k].selectionModeSchedule[epoch];
1969 if (epoch != 0)
1970 {
1971 string message = "INFO Switching selection mode for "
1972 "property \"" + k + "\" to ";
1973 if (p[k].selectionMode == SM_RANDOM)
1974 {
1975 message += strpr("SM_RANDOM (%d).\n", p[k].selectionMode);
1976 }
1977 else if (p[k].selectionMode == SM_SORT)
1978 {
1979 message += strpr("SM_SORT (%d).\n", p[k].selectionMode);
1980 }
1981 else if (p[k].selectionMode == SM_THRESHOLD)
1982 {
1983 message += strpr("SM_THRESHOLD (%d).\n",
1984 p[k].selectionMode);
1985 }
1986 log << message;
1987 }
1988 }
1989 }
1990
1991 return;
1992}
1993
1994void Training::loop()
1995{
1996 sw["loop"].start();
1997 log << "\n";
1998 log << "*** TRAINING LOOP ***********************"
1999 "**************************************\n";
2000 log << "\n";
2001 printHeader();
2002
2003 // Calculate initial RMSE and write comparison files.
2004 sw["error"].start();
2005    calculateErrorEpoch();
2006    sw["error"].stop();
2007
2008 // Write initial weights to files.
2009 if (myRank == 0) writeWeightsEpoch();
2010
2011 // Write learning curve.
2012 if (myRank == 0) writeLearningCurve(false);
2013
2014 // Write updater status to file.
2015 if (myRank == 0) writeUpdaterStatus(false);
2016
2017 // Write neuron statistics.
2018    writeNeuronStatisticsEpoch();
2019
2020 // Print timing information.
2021 sw["loop"].stop();
2022 printEpoch();
2023
2024 // Check if training should be continued.
2025 while (advance())
2026 {
2027 sw["loop"].start();
2028
2029 // Increment epoch counter.
2030 epoch++;
2031 log << "------\n";
2032
2033 // Reset update counters.
2034 for (auto k : pk) p[k].countUpdates = 0;
2035
2036 // Check if selection mode should be changed in this epoch.
2037        checkSelectionMode();
2038
2039 // Sort or shuffle update candidates.
2040 for (auto k : pk)
2041 {
2042 if (p[k].selectionMode == SM_SORT) sortUpdateCandidates(k);
2043            else shuffleUpdateCandidates(k);
2044        }
2045
2046 // Determine epoch update schedule.
2047        setEpochSchedule();
2048
2049 // Perform property updates according to schedule.
2050 sw["train"].start();
2051 for (auto i : epochSchedule)
2052 {
2053 string property = pk.at(i);
2054 update(property);
2055 p[property].countUpdates++;
2056 }
2057 sw["train"].stop();
2058
2059 // Reset neuron statistics.
2060        resetNeuronStatistics();
2061
2062 // Calculate errors and write comparison files.
2063 sw["error"].start();
2064        calculateErrorEpoch();
2065        sw["error"].stop();
2066
2067 // Write weights to files.
2068 if (myRank == 0) writeWeightsEpoch();
2069
2070 // Append to learning curve.
2071 if (myRank == 0) writeLearningCurve(true);
2072
2073 // Write updater status to file.
2074 if (myRank == 0) writeUpdaterStatus(true);
2075
2076 // Write neuron statistics.
2078
2079 // Print error overview and timing information.
2080 sw["loop"].stop();
2081 printEpoch();
2082
2083 if (myRank == 0) writeTimingData(epoch != 1);
2084 }
2085
2086 log << "-----------------------------------------"
2087 "--------------------------------------\n";
2088 log << strpr("TIMING Training loop finished: %.2f seconds.\n",
2089 sw["loop"].getTotal());
2090 log << "*****************************************"
2091 "**************************************\n";
2092
2093 return;
2094}
2095
2096void Training::update(string const& property)
2097{
2098 // Shortcuts.
2099 string const& k = property; // Property key.
2100 Property& pu = p[k]; // Update property.
2101 // Start watch for error and jacobian computation, reset loop timer if
2102 // first update in this epoch.
2103 bool newLoop = pu.countUpdates == 0;
2104 sw[k].start(newLoop);
2105 sw[k + "_err"].start(newLoop);
2106
2107#ifdef _OPENMP
2108 int num_threads = omp_get_max_threads();
2109 omp_set_num_threads(1);
2110#endif
2111
2112    ///////////////////////////////////////////////////////////////////////
2113    // PART 1: Find update candidate, compute error fractions and derivatives
2114    ///////////////////////////////////////////////////////////////////////
2115
2116 size_t batchSize = pu.taskBatchSize;
2117 if (batchSize == 0) batchSize = pu.patternsPerUpdate;
2118 bool derivatives = false;
2119 if (k == "force") derivatives = true;
2120
2121 vector<size_t> thresholdLoopCount(batchSize, 0);
2122 vector<double> currentRmseFraction(batchSize, 0.0);
2123 vector<UpdateCandidate*> currentUpdateCandidates(batchSize, NULL);
2124 for (size_t i = 0; i < numUpdaters; ++i)
2125 {
2126 fill(pu.error.at(i).begin(), pu.error.at(i).end(), 0.0);
2127 fill(pu.jacobian.at(i).begin(), pu.jacobian.at(i).end(), 0.0);
2128 }
2129
2130 // Loop over (mini-)batch size.
2131 for (size_t b = 0; b < batchSize; ++b)
2132 {
2133 UpdateCandidate* c = NULL; // Actual current update candidate.
2134 size_t indexBest = 0; // Index of best update candidate so far.
2135 double rmseFractionBest = 0.0; // RMSE of best update candidate so far.
2136
2137 // For SM_THRESHOLD need to loop until candidate's RMSE is above
2138 // threshold. Other modes don't loop here.
2139 size_t trials = 1;
2140 if (pu.selectionMode == SM_THRESHOLD) trials = pu.rmseThresholdTrials;
2141 size_t il = 0;
2142 for (il = 0; il < trials; ++il)
2143 {
2144 // Restart position index if necessary.
2145 if (pu.posUpdateCandidates >= pu.updateCandidates.size())
2146 {
2147 pu.posUpdateCandidates = 0;
2148 }
2149
2150 //log << strpr("pos %zu b %zu size %zu\n", pu.posUpdateCandidates, b, currentUpdateCandidates.size());
2151 // Set current update candidate.
2152 c = &(pu.updateCandidates.at(pu.posUpdateCandidates));
2153 // Keep update candidates (for logging later).
2154 currentUpdateCandidates.at(b) = c;
2155 // Shortcut for current structure.
2156 Structure& s = structures.at(c->s);
2157 // Calculate symmetry functions (if results are already stored
2158 // these functions will return immediately).
2159#ifdef N2P2_NO_SF_GROUPS
2160 calculateSymmetryFunctions(s, derivatives);
2161#else
2162 calculateSymmetryFunctionGroups(s, derivatives);
2163#endif
2164 // For SM_THRESHOLD calculate RMSE of update candidate.
2165 if (pu.selectionMode == SM_THRESHOLD)
2166 {
2167 if (k == "energy")
2168 {
2169                    if (nnpType == NNPType::SHORT_ONLY)
2170                    {
2171 calculateAtomicNeuralNetworks(s, derivatives);
2172 calculateEnergy(s);
2173 currentRmseFraction.at(b) =
2174 fabs(s.energyRef - s.energy)
2175 / (s.numAtoms * pu.errorTrain.at("RMSEpa"));
2176 }
2177 // Assume stage 2.
2178                    else if (nnpType == NNPType::SHORT_CHARGE_NN)
2179                    {
2180 // TODO: Reuse already present charge-NN data and
2181 // compute only short-NN energy contributions.
2182 throw runtime_error("ERROR: Not implemented.\n");
2183 }
2184 }
2185 else if (k == "force")
2186 {
2187                    if (nnpType == NNPType::SHORT_ONLY)
2188                    {
2189 calculateAtomicNeuralNetworks(s, derivatives);
2190 calculateForces(s);
2191 Atom const& a = s.atoms.at(c->a);
2192 currentRmseFraction.at(b) =
2193 fabs(a.fRef[c->c] - a.f[c->c])
2194 / pu.errorTrain.at("RMSE");
2195 }
2196 // Assume stage 2.
2197                    else if (nnpType == NNPType::SHORT_CHARGE_NN)
2198                    {
2199 // TODO: Reuse already present charge-NN data and
2200 // compute only short-NN force contributions.
2201 throw runtime_error("ERROR: Not implemented.\n");
2202 }
2203 }
2204 else if (k == "charge")
2205 {
2206 // Assume NNPType::SHORT_CHARGE_NN stage 1.
2207 // Compute only charge-NN
2208 Atom& a = s.atoms.at(c->a);
2209 NeuralNetwork& nn =
2210 elements.at(a.element).neuralNetworks.at("charge");
2211 nn.setInput(&(a.G.front()));
2212 nn.propagate();
2213 nn.getOutput(&(a.charge));
2214 currentRmseFraction.at(b) = fabs(a.chargeRef - a.charge)
2215 / pu.errorTrain.at("RMSE");
2216 }
2217 // If force RMSE is above threshold stop loop immediately.
2218 if (currentRmseFraction.at(b) > pu.rmseThreshold)
2219 {
2220 // Increment position in update candidate list.
2221                    pu.posUpdateCandidates++;
2222                    break;
2223 }
2224 // If loop continues, free memory and remember best candidate
2225 // so far.
2226 if (freeMemory)
2227 {
2228 s.freeAtoms(true);
2229 }
2230 if (currentRmseFraction.at(b) > rmseFractionBest)
2231 {
2232 rmseFractionBest = currentRmseFraction.at(b);
2233 indexBest = pu.posUpdateCandidates;
2234 }
2235 // Increment position in update candidate list.
2236                pu.posUpdateCandidates++;
2237            }
2238 // Break loop for all selection modes but SM_THRESHOLD.
2239 else if (pu.selectionMode == SM_RANDOM ||
2240 pu.selectionMode == SM_SORT)
2241 {
2242 // Increment position in update candidate list.
2243                pu.posUpdateCandidates++;
2244                break;
2245 }
2246 }
2247 thresholdLoopCount.at(b) = il;
2248
2249 // If loop was not stopped because of a proper update candidate found
2250 // (RMSE above threshold) use best candidate during iteration.
2251 if (pu.selectionMode == SM_THRESHOLD && il == trials)
2252 {
2253 // Set best candidate.
2254            c = &(pu.updateCandidates.at(indexBest));
2255            currentUpdateCandidates.at(b) = c;
2256 currentRmseFraction.at(b) = rmseFractionBest;
2257 // Need to calculate the symmetry functions again, maybe results
2258 // were not stored.
2259 Structure& s = structures.at(c->s);
2260#ifdef N2P2_NO_SF_GROUPS
2261 calculateSymmetryFunctions(s, derivatives);
2262#else
2263 calculateSymmetryFunctionGroups(s, derivatives);
2264#endif
2265 }
2266
2267        ///////////////////////////////////////////////////////////////////
2268        // PART 2: Compute error vector and Jacobian
2269        ///////////////////////////////////////////////////////////////////
2270
2271 Structure& s = structures.at(c->s);
2272 // Temporary storage for derivative contributions of atoms (dXdc stores
2273        // dEdc, dFdc or dQdc for energy, force or charge update, respectively).
2274 vector<vector<double>> dXdc;
2275 dXdc.resize(numElements);
2276 for (size_t i = 0; i < numElements; ++i)
2277 {
2278 size_t n = elements.at(i).neuralNetworks.at(nnId)
2279 .getNumConnections();
2280 dXdc.at(i).resize(n, 0.0);
2281 }
2282 // Precalculate offset in Jacobian array.
2283 size_t iu = 0;
2284 vector<size_t> offset(numElements, 0);
2285 for (size_t i = 0; i < numElements; ++i)
2286 {
2287 if (updateStrategy == US_ELEMENT) iu = i;
2288 else iu = 0;
2289            if (parallelMode == PM_TRAIN_ALL && jacobianMode != JM_SUM)
2290            {
2291 offset.at(i) += pu.offsetPerTask.at(myRank)
2292 * numWeightsPerUpdater.at(iu);
2293 //log << strpr("%zu os 1: %zu ", i, offset.at(i));
2294 }
2295 if (jacobianMode == JM_FULL)
2296 {
2297 offset.at(i) += b * numWeightsPerUpdater.at(iu);
2298 //log << strpr("%zu os 2: %zu ", i, offset.at(i));
2299 }
2300            if (updateStrategy == US_COMBINED)
2301            {
2302 offset.at(i) += weightsOffset.at(i);
2303 //log << strpr("%zu os 3: %zu", i, offset.at(i));
2304 }
2305 //log << strpr(" %zu final os: %zu\n", i, offset.at(i));
2306 }
2307 // Now compute Jacobian.
2308 if (k == "energy")
2309 {
2310            if (nnpType == NNPType::SHORT_ONLY)
2311            {
2312 // Loop over atoms and calculate atomic energy contributions.
2313 for (vector<Atom>::iterator it = s.atoms.begin();
2314 it != s.atoms.end(); ++it)
2315 {
2316 size_t i = it->element;
2317 NeuralNetwork& nn = elements.at(i).neuralNetworks.at(nnId);
2318 nn.setInput(&((it->G).front()));
2319 nn.propagate();
2320 nn.getOutput(&(it->energy));
2321 // Compute derivative of output node with respect to all
2322 // neural network connections (weights + biases).
2323 nn.calculateDEdc(&(dXdc.at(i).front()));
2324 // Finally sum up Jacobian.
2325 if (updateStrategy == US_ELEMENT) iu = i;
2326 else iu = 0;
2327 for (size_t j = 0; j < dXdc.at(i).size(); ++j)
2328 {
2329 pu.jacobian.at(iu).at(offset.at(i) + j) +=
2330 dXdc.at(i).at(j);
2331 }
2332 }
2333 }
2334            else if (nnpType == NNPType::SHORT_CHARGE_NN)
2335            {
2336 throw runtime_error("ERROR: Not implemented.\n");
2337 }
2338 }
2339 else if (k == "force")
2340 {
2341            if (nnpType == NNPType::SHORT_ONLY)
2342            {
2343 // Loop over atoms and calculate atomic energy contributions.
2344 for (vector<Atom>::iterator it = s.atoms.begin();
2345 it != s.atoms.end(); ++it)
2346 {
2347 // For force update save derivative of symmetry function
2348 // with respect to coordinate.
2349#ifndef N2P2_FULL_SFD_MEMORY
2350 collectDGdxia((*it), c->a, c->c);
2351#else
2352 it->collectDGdxia(c->a, c->c);
2353#endif
2354 size_t i = it->element;
2355 NeuralNetwork& nn = elements.at(i).neuralNetworks.at(nnId);
2356 nn.setInput(&((it->G).front()));
2357 nn.propagate();
2358 if (derivatives) nn.calculateDEdG(&((it->dEdG).front()));
2359 nn.getOutput(&(it->energy));
2360 // Compute derivative of output node with respect to all
2361 // neural network connections (weights + biases).
2362#ifndef N2P2_FULL_SFD_MEMORY
2363 nn.calculateDFdc(&(dXdc.at(i).front()),
2364 &(dGdxia.front()));
2365#else
2366 nn.calculateDFdc(&(dXdc.at(i).front()),
2367 &(it->dGdxia.front()));
2368#endif
2369 // Finally sum up Jacobian.
2370 if (updateStrategy == US_ELEMENT) iu = i;
2371 else iu = 0;
2372 for (size_t j = 0; j < dXdc.at(i).size(); ++j)
2373 {
2374 pu.jacobian.at(iu).at(offset.at(i) + j) +=
2375 dXdc.at(i).at(j);
2376 }
2377 }
2378
2379 }
2380            else if (nnpType == NNPType::SHORT_CHARGE_NN)
2381            {
2382 throw runtime_error("ERROR: Not implemented.\n");
2383 }
2384 }
2385 else if (k == "charge")
2386 {
2387 // Assume NNPType::SHORT_CHARGE_NN stage 1.
2388 // Shortcut to selected atom.
2389 Atom& a = s.atoms.at(c->a);
2390 size_t i = a.element;
2391 NeuralNetwork& nn = elements.at(i).neuralNetworks.at(nnId);
2392 nn.setInput(&(a.G.front()));
2393 nn.propagate();
2394 nn.getOutput(&(a.charge));
2395 // Compute derivative of output node with respect to all
2396 // neural network connections (weights + biases).
2397 nn.calculateDEdc(&(dXdc.at(i).front()));
2398 // Finally sum up Jacobian.
2399 if (updateStrategy == US_ELEMENT) iu = i;
2400 else iu = 0;
2401 for (size_t j = 0; j < dXdc.at(i).size(); ++j)
2402 {
2403 pu.jacobian.at(iu).at(offset.at(i) + j) +=
2404 dXdc.at(i).at(j);
2405 }
2406 }
2407
2408 // Sum up total potential energy or calculate force.
2409 if (k == "energy")
2410 {
2411 calculateEnergy(s);
2412 currentRmseFraction.at(b) = fabs(s.energyRef - s.energy)
2413 / (s.numAtoms
2414 * pu.errorTrain.at("RMSEpa"));
2415 }
2416 else if (k == "force")
2417 {
2418 calculateForces(s);
2419 Atom const& a = s.atoms.at(c->a);
2420 currentRmseFraction.at(b) = fabs(a.fRef[c->c] - a.f[c->c])
2421 / pu.errorTrain.at("RMSE");
2422 }
2423 else if (k == "charge")
2424 {
2425 Atom const& a = s.atoms.at(c->a);
2426 currentRmseFraction.at(b) = fabs(a.chargeRef - a.charge)
2427 / pu.errorTrain.at("RMSE");
2428 }
2429
2430 // Now symmetry function memory is not required any more for this
2431 // update.
2432 if (freeMemory) s.freeAtoms(true);
2433
2434 // Precalculate offset in error array.
2435 size_t offset2 = 0;
2436        if (parallelMode == PM_TRAIN_ALL && jacobianMode != JM_SUM)
2437        {
2438 offset2 += pu.offsetPerTask.at(myRank);
2439 //log << strpr("os 4: %zu ", offset2);
2440 }
2441 if (jacobianMode == JM_FULL)
2442 {
2443 offset2 += b;
2444 //log << strpr("os 5: %zu ", offset2);
2445 }
2446 //log << strpr(" final os: %zu\n", offset2);
2447
2448
2449 // Compute error vector (depends on update strategy).
2450        if (updateStrategy == US_COMBINED)
2451        {
2452 if (k == "energy")
2453 {
2454 pu.error.at(0).at(offset2) += s.energyRef - s.energy;
2455 }
2456 else if (k == "force")
2457 {
2458 Atom const& a = s.atoms.at(c->a);
2459 pu.error.at(0).at(offset2) += a.fRef[c->c] - a.f[c->c];
2460 }
2461 else if (k == "charge")
2462 {
2463 Atom const& a = s.atoms.at(c->a);
2464 pu.error.at(0).at(offset2) += a.chargeRef - a.charge;
2465 }
2466 }
2467 else if (updateStrategy == US_ELEMENT)
2468 {
2469 for (size_t i = 0; i < numUpdaters; ++i)
2470 {
2471 if (k == "energy")
2472 {
2473 pu.error.at(i).at(offset2) += (s.energyRef - s.energy)
2474 * s.numAtomsPerElement.at(i)
2475 / s.numAtoms;
2476 }
2477 else if (k == "force")
2478 {
2479 Atom const& a = s.atoms.at(c->a);
2480 pu.error.at(i).at(offset2) += (a.fRef[c->c] - a.f[c->c])
2481 * a.numNeighborsPerElement.at(i)
2482 / a.numNeighbors;
2483 }
2484 else if (k == "charge")
2485 {
2486 Atom const& a = s.atoms.at(c->a);
2487 pu.error.at(i).at(offset2) += a.chargeRef - a.charge;
2488 }
2489 }
2490 }
2491 }
2492
2493 // Apply force update weight to error and Jacobian.
2494 if (k == "force")
2495 {
2496 for (size_t i = 0; i < numUpdaters; ++i)
2497 {
2498 for (size_t j = 0; j < pu.error.at(i).size(); ++j)
2499 {
2500 pu.error.at(i).at(j) *= forceWeight;
2501 }
2502 for (size_t j = 0; j < pu.jacobian.at(i).size(); ++j)
2503 {
2504 pu.jacobian.at(i).at(j) *= forceWeight;
2505 }
2506 }
2507 }
2508 sw[k + "_err"].stop();
2509
2510    ///////////////////////////////////////////////////////////////////////
2511    // PART 3: Communicate error and Jacobian.
2512    ///////////////////////////////////////////////////////////////////////
2513
2514 sw[k + "_com"].start(newLoop);
2515 if (jacobianMode == JM_SUM)
2516 {
2517        if (parallelMode == PM_TRAIN_RK0)
2518        {
2519 for (size_t i = 0; i < numUpdaters; ++i)
2520 {
2521 if (myRank == 0) MPI_Reduce(MPI_IN_PLACE , &(pu.error.at(i).front()), 1, MPI_DOUBLE, MPI_SUM, 0, comm);
2522 else MPI_Reduce(&(pu.error.at(i).front()), &(pu.error.at(i).front()), 1, MPI_DOUBLE, MPI_SUM, 0, comm);
2523 if (myRank == 0) MPI_Reduce(MPI_IN_PLACE , &(pu.jacobian.at(i).front()), numWeightsPerUpdater.at(i), MPI_DOUBLE, MPI_SUM, 0, comm);
2524 else MPI_Reduce(&(pu.jacobian.at(i).front()), &(pu.jacobian.at(i).front()), numWeightsPerUpdater.at(i), MPI_DOUBLE, MPI_SUM, 0, comm);
2525 }
2526 }
2527 else if (parallelMode == PM_TRAIN_ALL)
2528 {
2529 for (size_t i = 0; i < numUpdaters; ++i)
2530 {
2531 MPI_Allreduce(MPI_IN_PLACE, &(pu.error.at(i).front()), 1, MPI_DOUBLE, MPI_SUM, comm);
2532 MPI_Allreduce(MPI_IN_PLACE, &(pu.jacobian.at(i).front()), numWeightsPerUpdater.at(i), MPI_DOUBLE, MPI_SUM, comm);
2533 }
2534 }
2535 }
2536 else if (jacobianMode == JM_TASK)
2537 {
2538        if (parallelMode == PM_TRAIN_RK0)
2539        {
2540 for (size_t i = 0; i < numUpdaters; ++i)
2541 {
2542 if (myRank == 0) MPI_Gather(MPI_IN_PLACE , 1, MPI_DOUBLE, &(pu.error.at(i).front()), 1, MPI_DOUBLE, 0, comm);
2543 else MPI_Gather(&(pu.error.at(i).front()), 1, MPI_DOUBLE, NULL , 1, MPI_DOUBLE, 0, comm);
2544 if (myRank == 0) MPI_Gather(MPI_IN_PLACE , numWeightsPerUpdater.at(i), MPI_DOUBLE, &(pu.jacobian.at(i).front()), numWeightsPerUpdater.at(i), MPI_DOUBLE, 0, comm);
2545 else MPI_Gather(&(pu.jacobian.at(i).front()), numWeightsPerUpdater.at(i), MPI_DOUBLE, NULL , numWeightsPerUpdater.at(i), MPI_DOUBLE, 0, comm);
2546 }
2547 }
2548 else if (parallelMode == PM_TRAIN_ALL)
2549 {
2550 for (size_t i = 0; i < numUpdaters; ++i)
2551 {
2552 MPI_Allgather(MPI_IN_PLACE, 1, MPI_DOUBLE, &(pu.error.at(i).front()), 1, MPI_DOUBLE, comm);
2553 MPI_Allgather(MPI_IN_PLACE, numWeightsPerUpdater.at(i), MPI_DOUBLE, &(pu.jacobian.at(i).front()), numWeightsPerUpdater.at(i), MPI_DOUBLE, comm);
2554 }
2555 }
2556 }
2557 else if (jacobianMode == JM_FULL)
2558 {
2559        if (parallelMode == PM_TRAIN_RK0)
2560        {
2561 for (size_t i = 0; i < numUpdaters; ++i)
2562 {
2563 if (myRank == 0) MPI_Gatherv(MPI_IN_PLACE , 0 , MPI_DOUBLE, &(pu.error.at(i).front()), &(pu.errorsPerTask.front()), &(pu.offsetPerTask.front()), MPI_DOUBLE, 0, comm);
2564 else MPI_Gatherv(&(pu.error.at(i).front()), pu.errorsPerTask.at(myRank), MPI_DOUBLE, NULL , NULL , NULL , MPI_DOUBLE, 0, comm);
2565 if (myRank == 0) MPI_Gatherv(MPI_IN_PLACE , 0 , MPI_DOUBLE, &(pu.jacobian.at(i).front()), &(pu.weightsPerTask.at(i).front()), &(pu.offsetJacobian.at(i).front()), MPI_DOUBLE, 0, comm);
2566 else MPI_Gatherv(&(pu.jacobian.at(i).front()), pu.weightsPerTask.at(i).at(myRank), MPI_DOUBLE, NULL , NULL , NULL , MPI_DOUBLE, 0, comm);
2567 }
2568 }
2569 else if (parallelMode == PM_TRAIN_ALL)
2570 {
2571 for (size_t i = 0; i < numUpdaters; ++i)
2572 {
2573 MPI_Allgatherv(MPI_IN_PLACE, 0, MPI_DOUBLE, &(pu.error.at(i).front()), &(pu.errorsPerTask.front()), &(pu.offsetPerTask.front()), MPI_DOUBLE, comm);
2574 MPI_Allgatherv(MPI_IN_PLACE, 0, MPI_DOUBLE, &(pu.jacobian.at(i).front()), &(pu.weightsPerTask.at(i).front()), &(pu.offsetJacobian.at(i).front()), MPI_DOUBLE, comm);
2575 }
2576 }
2577 }
2578 sw[k + "_com"].stop();
2579
2580    ///////////////////////////////////////////////////////////////////////
2581    // PART 4: Perform weight update and apply new weights.
2582    ///////////////////////////////////////////////////////////////////////
2583
2584 sw[k + "_upd"].start(newLoop);
2585#ifdef _OPENMP
2586 omp_set_num_threads(num_threads);
2587#endif
2588 // Loop over all updaters.
2589 for (size_t i = 0; i < updaters.size(); ++i)
2590 {
2591 updaters.at(i)->setError(&(pu.error.at(i).front()),
2592 pu.error.at(i).size());
2593 updaters.at(i)->setJacobian(&(pu.jacobian.at(i).front()),
2594 pu.error.at(i).size());
2595 if (updaterType == UT_KF)
2596 {
2597 KalmanFilter* kf = dynamic_cast<KalmanFilter*>(updaters.at(i));
2598 kf->setSizeObservation(pu.error.at(i).size());
2599 }
2600 updaters.at(i)->update();
2601 }
2602 countUpdates++;
2603
2604 // Redistribute weights to all MPI tasks.
2605    if (parallelMode == PM_TRAIN_RK0)
2606    {
2607 for (size_t i = 0; i < numUpdaters; ++i)
2608 {
2609 MPI_Bcast(&(weights.at(i).front()), weights.at(i).size(), MPI_DOUBLE, 0, comm);
2610 }
2611 }
2612
2613 // Set new weights in neural networks.
2614 setWeights();
2615 sw[k + "_upd"].stop();
2616
2617    ///////////////////////////////////////////////////////////////////////
2618    // PART 5: Communicate candidates and RMSE fractions and write log.
2619    ///////////////////////////////////////////////////////////////////////
2620
2621 sw[k + "_log"].start(newLoop);
2622 if (writeTrainingLog)
2623 {
2624 vector<int> procUpdateCandidate;
2625 vector<size_t> indexStructure;
2626 vector<size_t> indexStructureGlobal;
2627 vector<size_t> indexAtom;
2628 vector<size_t> indexCoordinate;
2629
2630 vector<int> currentUpdateCandidatesPerTask;
2631 vector<int> currentUpdateCandidatesOffset;
2632 int myCurrentUpdateCandidates = currentUpdateCandidates.size();
2633
2634 if (myRank == 0)
2635 {
2636 currentUpdateCandidatesPerTask.resize(numProcs, 0);
2637 currentUpdateCandidatesPerTask.at(0) = myCurrentUpdateCandidates;
2638 }
2639 if (myRank == 0) MPI_Gather(MPI_IN_PLACE , 1, MPI_INT, &(currentUpdateCandidatesPerTask.front()), 1, MPI_INT, 0, comm);
2640 else MPI_Gather(&(myCurrentUpdateCandidates), 1, MPI_INT, NULL , 1, MPI_INT, 0, comm);
2641
2642 if (myRank == 0)
2643 {
2644 int totalUpdateCandidates = 0;
2645 for (size_t i = 0; i < currentUpdateCandidatesPerTask.size(); ++i)
2646 {
2647 currentUpdateCandidatesOffset.push_back(totalUpdateCandidates);
2648 totalUpdateCandidates += currentUpdateCandidatesPerTask.at(i);
2649 }
2650 procUpdateCandidate.resize(totalUpdateCandidates, 0);
2651 indexStructure.resize(totalUpdateCandidates, 0);
2652 indexStructureGlobal.resize(totalUpdateCandidates, 0);
2653 indexAtom.resize(totalUpdateCandidates, 0);
2654 indexCoordinate.resize(totalUpdateCandidates, 0);
2655            // Increase size of these vectors (only rank 0).
2656            currentRmseFraction.resize(totalUpdateCandidates, 0.0);
2657            thresholdLoopCount.resize(totalUpdateCandidates, 0);
2658 }
2659 else
2660 {
2661 procUpdateCandidate.resize(myCurrentUpdateCandidates, 0);
2662 indexStructure.resize(myCurrentUpdateCandidates, 0);
2663 indexStructureGlobal.resize(myCurrentUpdateCandidates, 0);
2664 indexAtom.resize(myCurrentUpdateCandidates, 0);
2665 indexCoordinate.resize(myCurrentUpdateCandidates, 0);
2666 }
2667 for (int i = 0; i < myCurrentUpdateCandidates; ++i)
2668 {
2669 procUpdateCandidate.at(i) = myRank;
2670 UpdateCandidate& c = *(currentUpdateCandidates.at(i));
2671 indexStructure.at(i) = c.s;
2672 indexStructureGlobal.at(i) = structures.at(c.s).index;
2673 indexAtom.at(i) = c.a;
2674 indexCoordinate.at(i) = c.c;
2675 }
2676 if (myRank == 0)
2677 {
2678 MPI_Gatherv(MPI_IN_PLACE, 0, MPI_DOUBLE, &(currentRmseFraction.front()) , &(currentUpdateCandidatesPerTask.front()), &(currentUpdateCandidatesOffset.front()), MPI_DOUBLE, 0, comm);
2679 MPI_Gatherv(MPI_IN_PLACE, 0, MPI_SIZE_T, &(thresholdLoopCount.front()) , &(currentUpdateCandidatesPerTask.front()), &(currentUpdateCandidatesOffset.front()), MPI_SIZE_T, 0, comm);
2680 MPI_Gatherv(MPI_IN_PLACE, 0, MPI_INT , &(procUpdateCandidate.front()) , &(currentUpdateCandidatesPerTask.front()), &(currentUpdateCandidatesOffset.front()), MPI_INT , 0, comm);
2681 MPI_Gatherv(MPI_IN_PLACE, 0, MPI_SIZE_T, &(indexStructure.front()) , &(currentUpdateCandidatesPerTask.front()), &(currentUpdateCandidatesOffset.front()), MPI_SIZE_T, 0, comm);
2682 MPI_Gatherv(MPI_IN_PLACE, 0, MPI_SIZE_T, &(indexStructureGlobal.front()), &(currentUpdateCandidatesPerTask.front()), &(currentUpdateCandidatesOffset.front()), MPI_SIZE_T, 0, comm);
2683 MPI_Gatherv(MPI_IN_PLACE, 0, MPI_SIZE_T, &(indexAtom.front()) , &(currentUpdateCandidatesPerTask.front()), &(currentUpdateCandidatesOffset.front()), MPI_SIZE_T, 0, comm);
2684 MPI_Gatherv(MPI_IN_PLACE, 0, MPI_SIZE_T, &(indexCoordinate.front()) , &(currentUpdateCandidatesPerTask.front()), &(currentUpdateCandidatesOffset.front()), MPI_SIZE_T, 0, comm);
2685 }
2686 else
2687 {
2688 MPI_Gatherv(&(currentRmseFraction.front()) , myCurrentUpdateCandidates, MPI_DOUBLE, NULL, NULL, NULL, MPI_DOUBLE, 0, comm);
2689 MPI_Gatherv(&(thresholdLoopCount.front()) , myCurrentUpdateCandidates, MPI_SIZE_T, NULL, NULL, NULL, MPI_SIZE_T, 0, comm);
2690 MPI_Gatherv(&(procUpdateCandidate.front()) , myCurrentUpdateCandidates, MPI_INT , NULL, NULL, NULL, MPI_INT , 0, comm);
2691 MPI_Gatherv(&(indexStructure.front()) , myCurrentUpdateCandidates, MPI_SIZE_T, NULL, NULL, NULL, MPI_SIZE_T, 0, comm);
2692 MPI_Gatherv(&(indexStructureGlobal.front()), myCurrentUpdateCandidates, MPI_SIZE_T, NULL, NULL, NULL, MPI_SIZE_T, 0, comm);
2693 MPI_Gatherv(&(indexAtom.front()) , myCurrentUpdateCandidates, MPI_SIZE_T, NULL, NULL, NULL, MPI_SIZE_T, 0, comm);
2694 MPI_Gatherv(&(indexCoordinate.front()) , myCurrentUpdateCandidates, MPI_SIZE_T, NULL, NULL, NULL, MPI_SIZE_T, 0, comm);
2695 }
2696
2697 if (myRank == 0)
2698 {
2699 for (size_t i = 0; i < procUpdateCandidate.size(); ++i)
2700 {
2701 if (k == "energy")
2702 {
2703 addTrainingLogEntry(procUpdateCandidate.at(i),
2704 thresholdLoopCount.at(i),
2705 currentRmseFraction.at(i),
2706 indexStructureGlobal.at(i),
2707 indexStructure.at(i));
2708 }
2709 else if (k == "force")
2710 {
2711 addTrainingLogEntry(procUpdateCandidate.at(i),
2712 thresholdLoopCount.at(i),
2713 currentRmseFraction.at(i),
2714 indexStructureGlobal.at(i),
2715 indexStructure.at(i),
2716 indexAtom.at(i),
2717 indexCoordinate.at(i));
2718 }
2719 else if (k == "charge")
2720 {
2721 addTrainingLogEntry(procUpdateCandidate.at(i),
2722 thresholdLoopCount.at(i),
2723 currentRmseFraction.at(i),
2724 indexStructureGlobal.at(i),
2725 indexStructure.at(i),
2726 indexAtom.at(i));
2727 }
2728 }
2729 }
2730 }
2731 sw[k + "_log"].stop();
2732 sw[k].stop();
2733
2734 return;
2735}
2736
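Aside (illustrative sketch, not part of Training.cpp): stripped of MPI communication and bookkeeping, one update assembles an error vector e (reference minus prediction) and a Jacobian J of prediction derivatives, then hands both to the updater, which moves the weights. For a plain gradient-descent updater minimizing ½‖e‖² the step is w ← w + η Jᵀe; the GradientDescent and KalmanFilter classes used above implement more elaborate variants of this idea. Minimal sketch (all names hypothetical):

#include <cstddef>
#include <vector>

// One gradient-descent step. J is stored row-major with
// J[k * n + j] = d(prediction k)/d(weight j), e[k] = reference_k - prediction_k.
void gdStep(std::vector<double>&       w,
            std::vector<double> const& e,
            std::vector<double> const& J,
            double                     eta)
{
    std::size_t const n = w.size();
    for (std::size_t k = 0; k < e.size(); ++k)
    {
        for (std::size_t j = 0; j < n; ++j)
        {
            w[j] += eta * J[k * n + j] * e[k];
        }
    }
}
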
2737double Training::getSingleWeight(size_t element, size_t index)
2738{
2739 getWeights();
2740
2741 return weights.at(element).at(index);
2742}
2743
2744void Training::setSingleWeight(size_t element, size_t index, double value)
2745{
2746 weights.at(element).at(index) = value;
2747 setWeights();
2748
2749 return;
2750}
2751
2752vector<
2753vector<double> > Training::calculateWeightDerivatives(Structure* structure)
2754{
2755 Structure& s = *structure;
2756#ifdef N2P2_NO_SF_GROUPS
2757    calculateSymmetryFunctions(s, false);
2758#else
2759    calculateSymmetryFunctionGroups(s, false);
2760#endif
2761
2762 vector<vector<double> > dEdc;
2763 vector<vector<double> > dedc;
2764 dEdc.resize(numElements);
2765 dedc.resize(numElements);
2766 for (size_t i = 0; i < numElements; ++i)
2767 {
2768 size_t n = elements.at(i).neuralNetworks.at("short")
2769 .getNumConnections();
2770 dEdc.at(i).resize(n, 0.0);
2771 dedc.at(i).resize(n, 0.0);
2772 }
2773 for (vector<Atom>::iterator it = s.atoms.begin();
2774 it != s.atoms.end(); ++it)
2775 {
2776 size_t i = it->element;
2777 NeuralNetwork& nn = elements.at(i).neuralNetworks.at("short");
2778 nn.setInput(&((it->G).front()));
2779 nn.propagate();
2780 nn.getOutput(&(it->energy));
2781 nn.calculateDEdc(&(dedc.at(i).front()));
2782 for (size_t j = 0; j < dedc.at(i).size(); ++j)
2783 {
2784 dEdc.at(i).at(j) += dedc.at(i).at(j);
2785 }
2786 }
2787
2788 return dEdc;
2789}
2790
2791// Doxygen requires namespace prefix for arguments...
2792vector<
2793vector<double> > Training::calculateWeightDerivatives(Structure*  structure,
2794                                                      std::size_t atom,
2795 std::size_t component)
2796{
2797 Structure& s = *structure;
2798#ifdef N2P2_NO_SF_GROUPS
2799    calculateSymmetryFunctions(s, true);
2800#else
2801    calculateSymmetryFunctionGroups(s, true);
2802#endif
2803
2804 vector<vector<double> > dFdc;
2805 vector<vector<double> > dfdc;
2806 dFdc.resize(numElements);
2807 dfdc.resize(numElements);
2808 for (size_t i = 0; i < numElements; ++i)
2809 {
2810 size_t n = elements.at(i).neuralNetworks.at("short")
2811 .getNumConnections();
2812 dFdc.at(i).resize(n, 0.0);
2813 dfdc.at(i).resize(n, 0.0);
2814 }
2815 for (vector<Atom>::iterator it = s.atoms.begin();
2816 it != s.atoms.end(); ++it)
2817 {
2818#ifndef N2P2_FULL_SFD_MEMORY
2819 collectDGdxia((*it), atom, component);
2820#else
2821 it->collectDGdxia(atom, component);
2822#endif
2823 size_t i = it->element;
2824 NeuralNetwork& nn = elements.at(i).neuralNetworks.at("short");
2825 nn.setInput(&((it->G).front()));
2826 nn.propagate();
2827 nn.getOutput(&(it->energy));
2828#ifndef N2P2_FULL_SFD_MEMORY
2829 nn.calculateDFdc(&(dfdc.at(i).front()), &(dGdxia.front()));
2830#else
2831 nn.calculateDFdc(&(dfdc.at(i).front()), &(it->dGdxia.front()));
2832#endif
2833 for (size_t j = 0; j < dfdc.at(i).size(); ++j)
2834 {
2835 dFdc.at(i).at(j) += dfdc.at(i).at(j);
2836 }
2837 }
2838
2839 return dFdc;
2840}
2841
2842void Training::setTrainingLogFileName(string fileName)
2843{
2844 trainingLogFileName = fileName;
2845
2846 return;
2847}
2848
2849size_t Training::getNumConnections(string id) const
2850{
2851 size_t n = 0;
2852 for (auto const& e : elements)
2853 {
2854 n += e.neuralNetworks.at(id).getNumConnections();
2855 }
2856
2857 return n;
2858}
2859
2860vector<size_t> Training::getNumConnectionsPerElement(string id) const
2861{
2862 vector<size_t> npe;
2863 for (auto const& e : elements)
2864 {
2865 npe.push_back(e.neuralNetworks.at(id).getNumConnections());
2866 }
2867
2868 return npe;
2869}
2870
2871vector<size_t> Training::getConnectionOffsets(string id) const
2872{
2873 vector<size_t> offset;
2874 size_t n = 0;
2875 for (auto const& e : elements)
2876 {
2877 offset.push_back(n);
2878 n += e.neuralNetworks.at(id).getNumConnections();
2879 }
2880
2881 return offset;
2882}
2883
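Aside (illustrative sketch, not part of Training.cpp): getConnectionOffsets is an exclusive prefix sum over the per-element connection counts, so element e's weights occupy [offset[e], offset[e] + n_e) in a combined weight vector. Worked example with hypothetical counts:

#include <cstddef>
#include <cstdio>
#include <vector>

int main()
{
    std::vector<std::size_t> perElement = {120, 95, 240};
    std::vector<std::size_t> offset;
    std::size_t n = 0;
    for (std::size_t c : perElement)
    {
        offset.push_back(n); // running sum *before* adding this element
        n += c;
    }
    std::printf("%zu %zu %zu (total %zu)\n",
                offset.at(0), offset.at(1), offset.at(2), n); // 0 120 215 (455)
    return 0;
}
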
2884void Training::dPdc(string property,
2885 Structure& structure,
2886 vector<vector<double>>& dPdc)
2887{
2888 auto npe = getNumConnectionsPerElement();
2889 auto off = getConnectionOffsets();
2890 dPdc.clear();
2891
2892 if (property == "energy")
2893 {
2894 dPdc.resize(1);
2895 dPdc.at(0).resize(getNumConnections(), 0.0);
2896 for (auto const& a : structure.atoms)
2897 {
2898 size_t e = a.element;
2899 NeuralNetwork& nn = elements.at(e).neuralNetworks.at(nnId);
2900 nn.setInput(a.G.data());
2901 nn.propagate();
2902 vector<double> tmp(npe.at(e), 0.0);
2903 nn.calculateDEdc(tmp.data());
2904 for (size_t j = 0; j < tmp.size(); ++j)
2905 {
2906 dPdc.at(0).at(off.at(e) + j) += tmp.at(j);
2907 }
2908 }
2909 }
2910 else if (property == "force")
2911 {
2912 dPdc.resize(3 * structure.numAtoms);
2913 size_t count = 0;
2914 for (size_t ia = 0; ia < structure.numAtoms; ++ia)
2915 {
2916 for (size_t ixyz = 0; ixyz < 3; ++ixyz)
2917 {
2918 dPdc.at(count).resize(getNumConnections(), 0.0);
2919 for (auto& a : structure.atoms)
2920 {
2921#ifndef N2P2_FULL_SFD_MEMORY
2922 collectDGdxia(a, ia, ixyz);
2923#else
2924 a.collectDGdxia(ia, ixyz);
2925#endif
2926 size_t e = a.element;
2927 NeuralNetwork& nn = elements.at(e).neuralNetworks.at(nnId);
2928 nn.setInput(a.G.data());
2929 nn.propagate();
2930 nn.calculateDEdG(a.dEdG.data());
2931 nn.getOutput(&(a.energy));
2932 vector<double> tmp(npe.at(e), 0.0);
2933#ifndef N2P2_FULL_SFD_MEMORY
2934 nn.calculateDFdc(tmp.data(), dGdxia.data());
2935#else
2936 nn.calculateDFdc(tmp.data(), a.dGdxia.data());
2937#endif
2938 for (size_t j = 0; j < tmp.size(); ++j)
2939 {
2940 dPdc.at(count).at(off.at(e) + j) += tmp.at(j);
2941 }
2942 }
2943 count++;
2944 }
2945 }
2946 }
2947 else
2948 {
2949 throw runtime_error("ERROR: Weight derivatives not implemented for "
2950 "property \"" + property + "\".\n");
2951 }
2952
2953 return;
2954}
2955
2956void Training::dPdcN(string property,
2957 Structure& structure,
2958 vector<vector<double>>& dPdc,
2959 double delta)
2960{
2961 auto npe = getNumConnectionsPerElement();
2962 auto off = getConnectionOffsets();
2963 dPdc.clear();
2964
2965 if (property == "energy")
2966 {
2967 dPdc.resize(1);
2968 for (size_t ie = 0; ie < numElements; ++ie)
2969 {
2970 for (size_t ic = 0; ic < npe.at(ie); ++ic)
2971 {
2972 size_t const o = off.at(ie) + ic;
2973 double const w = weights.at(0).at(o);
2974
2975 weights.at(0).at(o) += delta;
2976 setWeights();
2977 calculateAtomicNeuralNetworks(structure, false);
2978 calculateEnergy(structure);
2979 double energyHigh = structure.energy;
2980
2981 weights.at(0).at(o) -= 2.0 * delta;
2982 setWeights();
2983 calculateAtomicNeuralNetworks(structure, false);
2984 calculateEnergy(structure);
2985 double energyLow = structure.energy;
2986
2987 dPdc.at(0).push_back((energyHigh - energyLow) / (2.0 * delta));
2988 weights.at(0).at(o) = w;
2989 }
2990 }
2991 }
2992 else if (property == "force")
2993 {
2994 size_t count = 0;
2995 dPdc.resize(3 * structure.numAtoms);
2996 for (size_t ia = 0; ia < structure.numAtoms; ++ia)
2997 {
2998 for (size_t ixyz = 0; ixyz < 3; ++ixyz)
2999 {
3000 for (size_t ie = 0; ie < numElements; ++ie)
3001 {
3002 for (size_t ic = 0; ic < npe.at(ie); ++ic)
3003 {
3004 size_t const o = off.at(ie) + ic;
3005 double const w = weights.at(0).at(o);
3006
3007 weights.at(0).at(o) += delta;
3008 setWeights();
3009 calculateAtomicNeuralNetworks(structure, true);
3010 calculateForces(structure);
3011 double forceHigh = structure.atoms.at(ia).f[ixyz];
3012
3013 weights.at(0).at(o) -= 2.0 * delta;
3014 setWeights();
3015 calculateAtomicNeuralNetworks(structure, true);
3016 calculateForces(structure);
3017 double forceLow = structure.atoms.at(ia).f[ixyz];
3018
3019 dPdc.at(count).push_back((forceHigh - forceLow)
3020 / (2.0 * delta));
3021 weights.at(0).at(o) = w;
3022 }
3023 }
3024 count++;
3025 }
3026 }
3027 }
3028 else
3029 {
3030 throw runtime_error("ERROR: Numeric weight derivatives not "
3031 "implemented for property \""
3032 + property + "\".\n");
3033 }
3034
3035 return;
3036}
3037
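Aside (illustrative sketch, not part of Training.cpp): dPdcN above checks the analytic derivatives with a symmetric difference quotient, f'(w) ≈ (f(w + δ) − f(w − δ)) / (2δ), perturbing one connection at a time and restoring it afterwards. The generic pattern:

#include <cmath>
#include <functional>

// Central difference; truncation error is O(delta^2).
double centralDiff(std::function<double(double)> const& f,
                   double x,
                   double delta)
{
    return (f(x + delta) - f(x - delta)) / (2.0 * delta);
}

int main()
{
    double d = centralDiff([](double x) { return x * x * x; }, 2.0, 1.0e-5);
    return (std::fabs(d - 12.0) < 1.0e-6) ? 0 : 1; // d/dx x^3 = 3x^2 = 12 at x = 2
}
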
3038bool Training::advance() const
3039{
3040 if (epoch < numEpochs) return true;
3041 else return false;
3042}
3043
3044void Training::getWeights()
3045{
3046    if (updateStrategy == US_COMBINED)
3047    {
3048 size_t pos = 0;
3049 for (size_t i = 0; i < numElements; ++i)
3050 {
3051 NeuralNetwork const& nn = elements.at(i).neuralNetworks.at(nnId);
3052 nn.getConnections(&(weights.at(0).at(pos)));
3053 pos += nn.getNumConnections();
3054 }
3055 }
3056 else if (updateStrategy == US_ELEMENT)
3057 {
3058 for (size_t i = 0; i < numElements; ++i)
3059 {
3060 NeuralNetwork const& nn = elements.at(i).neuralNetworks.at(nnId);
3061 nn.getConnections(&(weights.at(i).front()));
3062 }
3063 }
3064
3065 return;
3066}
3067
3068void Training::setWeights()
3069{
3070    if (updateStrategy == US_COMBINED)
3071    {
3072 size_t pos = 0;
3073 for (size_t i = 0; i < numElements; ++i)
3074 {
3075 NeuralNetwork& nn = elements.at(i).neuralNetworks.at(nnId);
3076 nn.setConnections(&(weights.at(0).at(pos)));
3077 pos += nn.getNumConnections();
3078 }
3079 }
3080 else if (updateStrategy == US_ELEMENT)
3081 {
3082 for (size_t i = 0; i < numElements; ++i)
3083 {
3084 NeuralNetwork& nn = elements.at(i).neuralNetworks.at(nnId);
3085 nn.setConnections(&(weights.at(i).front()));
3086 }
3087 }
3088
3089 return;
3090}
3091
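Aside (illustrative sketch, not part of Training.cpp): with US_COMBINED all element networks share one flat weight vector, and getWeights/setWeights walk it with a running position, as above. The copy-out half of that pattern with a stand-in Net type (hypothetical):

#include <cstddef>
#include <cstring>
#include <vector>

struct Net // stand-in for nnp::NeuralNetwork
{
    std::vector<double> c; // connections (weights + biases)
    std::size_t getNumConnections() const { return c.size(); }
    void getConnections(double* out) const
    {
        std::memcpy(out, c.data(), c.size() * sizeof(double));
    }
};

int main()
{
    std::vector<Net> nets = {{{1, 2}}, {{3, 4, 5}}};
    std::vector<double> combined(5);
    std::size_t pos = 0;
    for (auto const& nn : nets) // getWeights() analogue
    {
        nn.getConnections(&combined.at(pos));
        pos += nn.getNumConnections();
    }
    // combined = {1, 2, 3, 4, 5}
    return 0;
}
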
3092// Doxygen requires namespace prefix for arguments...
3093void Training::addTrainingLogEntry(int         proc,
3094                                   std::size_t il,
3095 double f,
3096 std::size_t isg,
3097 std::size_t is)
3098{
3099 string s = strpr(" E %5zu %10zu %5d %3zu %10.2E %10zu %5zu\n",
3100 epoch, countUpdates, proc, il + 1, f, isg, is);
3101 trainingLog << s;
3102
3103 return;
3104}
3105
3106// Doxygen requires namespace prefix for arguments...
3107void Training::addTrainingLogEntry(int         proc,
3108                                   std::size_t il,
3109 double f,
3110 std::size_t isg,
3111 std::size_t is,
3112 std::size_t ia,
3113 std::size_t ic)
3114{
3115 string s = strpr(" F %5zu %10zu %5d %3zu %10.2E %10zu %5zu %5zu %2zu\n",
3116 epoch, countUpdates, proc, il + 1, f, isg, is, ia, ic);
3117 trainingLog << s;
3118
3119 return;
3120}
3121
3122// Doxygen requires namespace prefix for arguments...
3123void Training::addTrainingLogEntry(int         proc,
3124                                   std::size_t il,
3125 double f,
3126 std::size_t isg,
3127 std::size_t is,
3128 std::size_t ia)
3129{
3130 string s = strpr(" Q %5zu %10zu %5d %3zu %10.2E %10zu %5zu %5zu\n",
3131 epoch, countUpdates, proc, il + 1, f, isg, is, ia);
3132 trainingLog << s;
3133
3134 return;
3135}
3136
3137#ifndef N2P2_FULL_SFD_MEMORY
3138void Training::collectDGdxia(Atom const& atom,
3139                             size_t      indexAtom,
3140 size_t indexComponent)
3141{
3142 size_t const nsf = atom.numSymmetryFunctions;
3143
3144 // Reset dGdxia array.
3145 dGdxia.clear();
3146 vector<double>(dGdxia).swap(dGdxia);
3147 dGdxia.resize(nsf, 0.0);
3148
3149 vector<vector<size_t> > const& tableFull
3150 = elements.at(atom.element).getSymmetryFunctionTable();
3151
3152 for (size_t i = 0; i < atom.numNeighbors; i++)
3153 {
3154 if (atom.neighbors[i].index == indexAtom)
3155 {
3156 Atom::Neighbor const& n = atom.neighbors[i];
3157 vector<size_t> const& table = tableFull.at(n.element);
3158 for (size_t j = 0; j < n.dGdr.size(); ++j)
3159 {
3160 dGdxia[table.at(j)] += n.dGdr[j][indexComponent];
3161 }
3162 }
3163 }
3164 if (atom.index == indexAtom)
3165 {
3166 for (size_t i = 0; i < nsf; ++i)
3167 {
3168 dGdxia[i] += atom.dGdr[i][indexComponent];
3169 }
3170 }
3171
3172 return;
3173}
3174#endif
3175
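Aside (illustrative sketch, not part of Training.cpp): collectDGdxia gathers, for one fixed Cartesian coordinate x of atom i, the derivatives dG_j/dx from the atom's own and its neighbors' stored blocks; the force component then follows from the chain rule F = −Σ_j (∂E/∂G_j)(∂G_j/∂x). The final contraction, as a sketch:

#include <cstddef>
#include <vector>

// Chain rule for one coordinate: combine dE/dG with the collected dG/dx.
double dEdx(std::vector<double> const& dEdG,
            std::vector<double> const& dGdx)
{
    double d = 0.0;
    for (std::size_t j = 0; j < dEdG.size(); ++j)
    {
        d += dEdG.at(j) * dGdx.at(j);
    }
    return d; // the force component is the negative of this sum
}
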
3176void Training::randomizeNeuralNetworkWeights(string const& type)
3177{
3178 string keywordNW = "";
3179 if (type == "short" ) keywordNW = "nguyen_widrow_weights_short";
3180 else if (type == "charge") keywordNW = "nguyen_widrow_weights_charge";
3181 else
3182 {
3183 throw runtime_error("ERROR: Unknown neural network type.\n");
3184 }
3185
3186 double minWeights = atof(settings["weights_min"].c_str());
3187 double maxWeights = atof(settings["weights_max"].c_str());
3188 log << strpr("Initial weights selected randomly in interval "
3189 "[%f, %f).\n", minWeights, maxWeights);
3190 vector<double> w;
3191 for (size_t i = 0; i < numElements; ++i)
3192 {
3193 NeuralNetwork& nn = elements.at(i).neuralNetworks.at(type);
3194 w.resize(nn.getNumConnections(), 0);
3195 for (size_t j = 0; j < w.size(); ++j)
3196 {
3197 w.at(j) = minWeights + gsl_rng_uniform(rngGlobal)
3198 * (maxWeights - minWeights);
3199 }
3200 nn.setConnections(&(w.front()));
3201 }
3202 if (settings.keywordExists(keywordNW))
3203 {
3204 log << "Weights modified according to Nguyen Widrow scheme.\n";
3205 for (vector<Element>::iterator it = elements.begin();
3206 it != elements.end(); ++it)
3207 {
3208 NeuralNetwork& nn = it->neuralNetworks.at(type);
3209            nn.modifyConnections(NeuralNetwork::MS_NGUYENWIDROW);
3210        }
3211 }
3212 else if (settings.keywordExists("precondition_weights"))
3213 {
3214 throw runtime_error("ERROR: Preconditioning of weights not yet"
3215 " implemented.\n");
3216 }
3217 else
3218 {
3219        log << "Weights modified according to Glorot Bengio scheme.\n";
3220 //log << "Weights connected to output layer node set to zero.\n";
3221 log << "Biases set to zero.\n";
3222 for (vector<Element>::iterator it = elements.begin();
3223 it != elements.end(); ++it)
3224 {
3225 NeuralNetwork& nn = it->neuralNetworks.at(type);
3226            nn.modifyConnections(NeuralNetwork::MS_GLOROTBENGIO);
3227            //nn->modifyConnections(NeuralNetwork::MS_ZEROOUTPUTWEIGHTS);
3228            nn.modifyConnections(NeuralNetwork::MS_ZEROBIAS);
3229        }
3230 }
3231
3232 return;
3233}
3234
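Aside (illustrative sketch, not part of Training.cpp): the initialization above draws every connection uniformly from [weights_min, weights_max) before an optional Nguyen-Widrow or Glorot-Bengio modification. An equivalent draw using the standard library instead of GSL:

#include <random>
#include <vector>

int main()
{
    double const wMin = -1.0; // weights_min analogue
    double const wMax =  1.0; // weights_max analogue
    std::mt19937_64 rng(42);  // stand-in for the global, equally seeded RNG
    std::uniform_real_distribution<double> u(wMin, wMax); // samples [wMin, wMax)
    std::vector<double> w(100);
    for (auto& x : w) x = u(rng);
    return 0;
}
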
3235void Training::setupSelectionMode(string const& property)
3236{
3237 bool all = (property == "all");
3238 bool isProperty = (find(pk.begin(), pk.end(), property) != pk.end());
3239 if (!(all || isProperty))
3240 {
3241 throw runtime_error("ERROR: Unknown property for selection mode"
3242 " setup.\n");
3243 }
3244
3245 if (all)
3246 {
3247 if (!(settings.keywordExists("selection_mode") ||
3248 settings.keywordExists("rmse_threshold") ||
3249 settings.keywordExists("rmse_threshold_trials"))) return;
3250 log << "Global selection mode settings:\n";
3251 }
3252 else
3253 {
3254 if (!(settings.keywordExists("selection_mode_" + property) ||
3255 settings.keywordExists("rmse_threshold_" + property) ||
3256 settings.keywordExists("rmse_threshold_trials_"
3257 + property))) return;
3258 log << "Selection mode settings specific to property \""
3259 << property << "\":\n";
3260 }
3261 string keyword;
3262 if (all) keyword = "selection_mode";
3263 else keyword = "selection_mode_" + property;
3264
3265 if (settings.keywordExists(keyword))
3266 {
3267 map<size_t, SelectionMode> schedule;
3268 vector<string> args = split(settings[keyword]);
3269 if (args.size() % 2 != 1)
3270 {
3271 throw runtime_error("ERROR: Incorrect selection mode format.\n");
3272 }
3273 schedule[0] = (SelectionMode)atoi(args.at(0).c_str());
3274 for (size_t i = 1; i < args.size(); i = i + 2)
3275 {
3276 schedule[(size_t)atoi(args.at(i).c_str())] =
3277 (SelectionMode)atoi(args.at(i + 1).c_str());
3278 }
3279 for (map<size_t, SelectionMode>::const_iterator it = schedule.begin();
3280 it != schedule.end(); ++it)
3281 {
3282 log << strpr("- Selection mode starting with epoch %zu:\n",
3283 it->first);
3284 if (it->second == SM_RANDOM)
3285 {
3286 log << strpr(" Random selection of update candidates: "
3287 "SelectionMode::SM_RANDOM (%d)\n", it->second);
3288 }
3289 else if (it->second == SM_SORT)
3290 {
3291 log << strpr(" Update candidates selected according to error: "
3292 "SelectionMode::SM_SORT (%d)\n", it->second);
3293 }
3294 else if (it->second == SM_THRESHOLD)
3295 {
3296 log << strpr(" Update candidates chosen randomly above RMSE "
3297 "threshold: SelectionMode::SM_THRESHOLD (%d)\n",
3298 it->second);
3299 }
3300 else
3301 {
3302 throw runtime_error("ERROR: Unknown selection mode.\n");
3303 }
3304 }
3305 if (all)
3306 {
3307 for (auto& i : p)
3308 {
3309 i.second.selectionModeSchedule = schedule;
3310 i.second.selectionMode = schedule[0];
3311 }
3312 }
3313 else
3314 {
3315 p[property].selectionModeSchedule = schedule;
3316 p[property].selectionMode = schedule[0];
3317 }
3318 }
3319
3320 if (all) keyword = "rmse_threshold";
3321 else keyword = "rmse_threshold_" + property;
3322 if (settings.keywordExists(keyword))
3323 {
3324 double t = atof(settings[keyword].c_str());
3325 log << strpr("- RMSE selection threshold: %.2f * RMSE\n", t);
3326 if (all) for (auto& i : p) i.second.rmseThreshold = t;
3327 else p[property].rmseThreshold = t;
3328 }
3329
3330 if (all) keyword = "rmse_threshold_trials";
3331 else keyword = "rmse_threshold_trials_" + property;
3332 if (settings.keywordExists(keyword))
3333 {
3334 size_t t = atoi(settings[keyword].c_str());
3335 log << strpr("- RMSE selection trials : %zu\n", t);
3336 if (all) for (auto& i : p) i.second.rmseThresholdTrials = t;
3337 else p[property].rmseThresholdTrials = t;
3338 }
3339
3340 return;
3341}
3342
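Aside (illustrative sketch, not part of Training.cpp): the selection_mode keyword takes an odd number of tokens, an initial mode followed by epoch/mode pairs, and is parsed into a map keyed by starting epoch, as above. A standalone version of that parse (values hypothetical):

#include <cstddef>
#include <cstdlib>
#include <map>
#include <string>
#include <vector>

int main()
{
    // E.g. "selection_mode 2 10 0 20 2": start in mode 2,
    // switch to mode 0 at epoch 10 and back to mode 2 at epoch 20.
    std::vector<std::string> args = {"2", "10", "0", "20", "2"};
    std::map<std::size_t, int> schedule;
    schedule[0] = std::atoi(args.at(0).c_str());
    for (std::size_t i = 1; i < args.size(); i += 2)
    {
        schedule[std::atoi(args.at(i).c_str())]
            = std::atoi(args.at(i + 1).c_str());
    }
    return 0; // schedule = {0: 2, 10: 0, 20: 2}
}
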
3343void Training::setupFileOutput(string const& type)
3344{
3345 string keyword = "write_";
3346 bool isProperty = (find(pk.begin(), pk.end(), type) != pk.end());
3347 if (type == "energy" ) keyword += "trainpoints";
3348 else if (type == "force" ) keyword += "trainforces";
3349 else if (type == "charge" ) keyword += "traincharges";
3350 else if (type == "weights_epoch") keyword += type;
3351 else if (type == "neuronstats" ) keyword += type;
3352 else
3353 {
3354 throw runtime_error("ERROR: Invalid type for file output setup.\n");
3355 }
3356
3357    // Check how often these output files should be written.
3358 if (settings.keywordExists(keyword))
3359 {
3360 size_t* writeEvery = nullptr;
3361 size_t* writeAlways = nullptr;
3362 string message;
3363 if (isProperty)
3364 {
3365 writeEvery = &(p[type].writeCompEvery);
3366 writeAlways = &(p[type].writeCompAlways);
3367 message = "Property \"" + type + "\" comparison";
3368 message.at(0) = toupper(message.at(0));
3369 }
3370 else if (type == "weights_epoch")
3371 {
3372 writeEvery = &writeWeightsEvery;
3373 writeAlways = &writeWeightsAlways;
3374 message = "Weight";
3375 }
3376 else if (type == "neuronstats")
3377 {
3378 writeEvery = &writeNeuronStatisticsEvery;
3379 writeAlways = &writeNeuronStatisticsAlways;
3380 message = "Neuron statistics";
3381 }
3382
3383 *writeEvery = 1;
3384 vector<string> v = split(reduce(settings[keyword]));
3385 if (v.size() == 1) *writeEvery = (size_t)atoi(v.at(0).c_str());
3386 else if (v.size() == 2)
3387 {
3388 *writeEvery = (size_t)atoi(v.at(0).c_str());
3389 *writeAlways = (size_t)atoi(v.at(1).c_str());
3390 }
3391 log << strpr((message
3392 + " files will be written every %zu epochs.\n").c_str(),
3393 *writeEvery);
3394 if (*writeAlways > 0)
3395 {
3396 log << strpr((message
3397 + " files will always be written up to epoch "
3398 "%zu.\n").c_str(), *writeAlways);
3399 }
3400 }
3401
3402 return;
3403}
3404
3405void Training::setupUpdatePlan(string const& property)
3406{
3407 bool isProperty = (find(pk.begin(), pk.end(), property) != pk.end());
3408 if (!isProperty)
3409 {
3410 throw runtime_error("ERROR: Unknown property for update plan"
3411 " setup.\n");
3412 }
3413
3414 // Actual property modified here.
3415 Property& pa = p[property];
3416 string keyword = property + "_fraction";
3417
3418    // Override force fraction if keyword "force_energy_ratio" is provided.
3419 if (property == "force" &&
3420 p.exists("energy") &&
3421 settings.keywordExists("force_energy_ratio"))
3422 {
3423 double const ratio = atof(settings["force_energy_ratio"].c_str());
3424 if (settings.keywordExists(keyword))
3425 {
3426 log << "WARNING: Given force fraction is ignored because "
3427 "force/energy ratio is provided.\n";
3428 }
3429 log << strpr("Desired force/energy update ratio : %.6f\n",
3430 ratio);
3431 log << "----------------------------------------------\n";
3432 pa.epochFraction = (p["energy"].numTrainPatterns * ratio)
3433 / p["force"].numTrainPatterns;
3434 }
3435 // Default action = read "<property>_fraction" keyword.
3436 else
3437 {
3438 pa.epochFraction = atof(settings[keyword].c_str());
3439 }
3440
3441 keyword = "task_batch_size_" + property;
3442 pa.taskBatchSize = (size_t)atoi(settings[keyword].c_str());
3443 if (pa.taskBatchSize == 0)
3444 {
3445        pa.patternsPerUpdate =
3446            static_cast<size_t>(pa.updateCandidates.size() * pa.epochFraction);
3447 pa.numUpdates = 1;
3448 }
3449 else
3450 {
3451        pa.patternsPerUpdate = pa.taskBatchSize;
3452        pa.numUpdates =
3453 static_cast<size_t>((pa.numTrainPatterns * pa.epochFraction)
3454 / pa.taskBatchSize / numProcs);
3455 }
3456    pa.patternsPerUpdateGlobal = pa.patternsPerUpdate;
3457    MPI_Allreduce(MPI_IN_PLACE, &(pa.patternsPerUpdateGlobal), 1, MPI_SIZE_T, MPI_SUM, comm);
3458 pa.errorsPerTask.resize(numProcs, 0);
3459 if (jacobianMode == JM_FULL)
3460 {
3461 pa.errorsPerTask.at(myRank) = static_cast<int>(pa.patternsPerUpdate);
3462 }
3463 else
3464 {
3465 pa.errorsPerTask.at(myRank) = 1;
3466 }
3467 MPI_Allgather(MPI_IN_PLACE, 1, MPI_INT, &(pa.errorsPerTask.front()), 1, MPI_INT, comm);
3468 if (jacobianMode == JM_FULL)
3469 {
3470 pa.weightsPerTask.resize(numUpdaters);
3471 for (size_t i = 0; i < numUpdaters; ++i)
3472 {
3473 pa.weightsPerTask.at(i).resize(numProcs, 0);
3474 for (int j = 0; j < numProcs; ++j)
3475 {
3476 pa.weightsPerTask.at(i).at(j) = pa.errorsPerTask.at(j)
3477 * numWeightsPerUpdater.at(i);
3478 }
3479 }
3480 }
3481 pa.numErrorsGlobal = 0;
3482 for (size_t i = 0; i < pa.errorsPerTask.size(); ++i)
3483 {
3484 pa.offsetPerTask.push_back(pa.numErrorsGlobal);
3485 pa.numErrorsGlobal += pa.errorsPerTask.at(i);
3486 }
3487 pa.offsetJacobian.resize(numUpdaters);
3488 for (size_t i = 0; i < numUpdaters; ++i)
3489 {
3490 for (size_t j = 0; j < pa.offsetPerTask.size(); ++j)
3491 {
3492 pa.offsetJacobian.at(i).push_back(pa.offsetPerTask.at(j) *
3493 numWeightsPerUpdater.at(i));
3494 }
3495 }
3496 log << "Update plan for property \"" + property + "\":\n";
3497 log << strpr("- Per-task batch size : %zu\n",
3498 pa.taskBatchSize);
3499 log << strpr("- Fraction of patterns used per epoch : %.6f\n",
3500 pa.epochFraction);
3501 if (pa.numUpdates == 0)
3502 {
3503        log << "WARNING: No updates are planned for this property.\n";
3504 }
3505 log << strpr("- Updates per epoch : %zu\n",
3506 pa.numUpdates);
3507 log << strpr("- Patterns used per update (rank %3d / global) : "
3508 "%10zu / %zu\n",
3509                 myRank, pa.patternsPerUpdate, pa.patternsPerUpdateGlobal);
3510    log << "----------------------------------------------\n";
3511
3512 return;
3513}
3514
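Aside (illustrative sketch, not part of Training.cpp): with a nonzero task batch size the number of updates per epoch follows directly from numUpdates = numTrainPatterns * epochFraction / (taskBatchSize * numProcs). Worked example with hypothetical values:

#include <cstddef>
#include <cstdio>

int main()
{
    std::size_t numTrainPatterns = 12000;
    double      epochFraction    = 0.3; // e.g. a force_fraction analogue
    std::size_t taskBatchSize    = 10;
    int         numProcs         = 4;
    std::size_t numUpdates       = static_cast<std::size_t>(
        (numTrainPatterns * epochFraction) / taskBatchSize / numProcs);
    std::printf("%zu updates per epoch\n", numUpdates); // 90
    return 0;
}
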
3515void Training::allocateArrays(string const& property)
3516{
3517 bool isProperty = (find(pk.begin(), pk.end(), property) != pk.end());
3518 if (!isProperty)
3519 {
3520 throw runtime_error("ERROR: Unknown property for array allocation.\n");
3521 }
3522
3523 log << "Allocating memory for " + property +
3524 " error vector and Jacobian.\n";
3525 Property& pa = p[property];
3526 pa.error.resize(numUpdaters);
3527 pa.jacobian.resize(numUpdaters);
3528 for (size_t i = 0; i < numUpdaters; ++i)
3529 {
3530 size_t size = 1;
3531 if (( parallelMode == PM_TRAIN_ALL ||
3532 (parallelMode == PM_TRAIN_RK0 && myRank == 0)) &&
3533            jacobianMode != JM_SUM)
3534        {
3535 size *= pa.numErrorsGlobal;
3536 }
3537 else if ((parallelMode == PM_TRAIN_RK0 && myRank != 0) &&
3538                 jacobianMode != JM_SUM)
3539        {
3540 size *= pa.errorsPerTask.at(myRank);
3541 }
3542 pa.error.at(i).resize(size, 0.0);
3543 pa.jacobian.at(i).resize(size * numWeightsPerUpdater.at(i), 0.0);
3544 log << strpr("Updater %3zu:\n", i);
3545 log << strpr(" - Error size: %zu\n", pa.error.at(i).size());
3546 log << strpr(" - Jacobian size: %zu\n", pa.jacobian.at(i).size());
3547 }
3548 log << "----------------------------------------------\n";
3549
3550 return;
3551}
3552
3553void Training::writeTimingData(bool append, string const fileName)
3554{
3555 ofstream file;
3556 string fileNameActual = fileName;
3557    if (nnpType == NNPType::SHORT_CHARGE_NN)
3558    {
3559 fileNameActual += strpr(".stage-%zu", stage);
3560 }
3561
3562 vector<string> sub = {"_err", "_com", "_upd", "_log"};
3563 if (append) file.open(fileNameActual.c_str(), ofstream::app);
3564 else
3565 {
3566 file.open(fileNameActual.c_str());
3567
3568 // File header.
3569 vector<string> title;
3570 vector<string> colName;
3571 vector<string> colInfo;
3572 vector<size_t> colSize;
3573 title.push_back("Timing data for training loop.");
3574 colSize.push_back(10);
3575 colName.push_back("epoch");
3576 colInfo.push_back("Current epoch.");
3577 colSize.push_back(11);
3578 colName.push_back("train");
3579 colInfo.push_back("Time for training.");
3580 colSize.push_back(7);
3581 colName.push_back("ptrain");
3582 colInfo.push_back("Time for training (percentage of loop).");
3583 colSize.push_back(11);
3584 colName.push_back("error");
3585 colInfo.push_back("Time for error calculation.");
3586 colSize.push_back(7);
3587 colName.push_back("perror");
3588 colInfo.push_back("Time for error calculation (percentage of loop).");
3589 colSize.push_back(11);
3590 colName.push_back("epoch");
3591 colInfo.push_back("Time for this epoch.");
3592 colSize.push_back(11);
3593 colName.push_back("total");
3594 colInfo.push_back("Total time for all epochs.");
3595 for (auto k : pk)
3596 {
3597 colSize.push_back(11);
3598 colName.push_back(p[k].tiny + "train");
3599 colInfo.push_back("");
3600 colSize.push_back(7);
3601 colName.push_back(p[k].tiny + "ptrain");
3602 colInfo.push_back("");
3603 }
3604 for (auto s : sub)
3605 {
3606 for (auto k : pk)
3607 {
3608 colSize.push_back(11);
3609 colName.push_back(p[k].tiny + s);
3610 colInfo.push_back("");
3611 colSize.push_back(7);
3612 colName.push_back(p[k].tiny + "p" + s);
3613 colInfo.push_back("");
3614 }
3615 }
3616 appendLinesToFile(file,
3617 createFileHeader(title, colSize, colName, colInfo));
3618 }
3619
3620 double timeLoop = sw["loop"].getLoop();
3621 file << strpr("%10zu", epoch);
3622 file << strpr(" %11.3E", sw["train"].getLoop());
3623 file << strpr(" %7.3f", sw["train"].getLoop() / timeLoop);
3624 file << strpr(" %11.3E", sw["error"].getLoop());
3625 file << strpr(" %7.3f", sw["error"].getLoop() / timeLoop);
3626 file << strpr(" %11.3E", timeLoop);
3627 file << strpr(" %11.3E", sw["loop"].getTotal());
3628
3629 for (auto k : pk)
3630 {
3631 file << strpr(" %11.3E", sw[k].getLoop());
3632 file << strpr(" %7.3f", sw[k].getLoop() / sw["train"].getLoop());
3633 }
3634 for (auto s : sub)
3635 {
3636 for (auto k : pk)
3637 {
3638 file << strpr(" %11.3E", sw[k + s].getLoop());
3639 file << strpr(" %7.3f", sw[k + s].getLoop() / sw[k].getLoop());
3640 }
3641 }
3642 file << "\n";
3643
3644 file.flush();
3645 file.close();
3646
3647 return;
3648}
3649
3650Training::Property::Property(string const& property) :
3651 property (property ),
3652 displayMetric ("" ),
3653 tiny ("" ),
3654 plural ("" ),
3655 selectionMode (SM_RANDOM),
3656 numTrainPatterns (0 ),
3657 numTestPatterns (0 ),
3658 taskBatchSize (0 ),
3659 writeCompEvery (0 ),
3660 writeCompAlways (0 ),
3661 posUpdateCandidates (0 ),
3662 rmseThresholdTrials (0 ),
3663 countUpdates (0 ),
3664 numUpdates (0 ),
3665 patternsPerUpdate (0 ),
3666 patternsPerUpdateGlobal(0 ),
3667 numErrorsGlobal (0 ),
3668 epochFraction (0.0 ),
3669 rmseThreshold (0.0 )
3670{
3671 if (property == "energy")
3672 {
3673 tiny = "E";
3674 plural = "energies";
3675 errorMetrics = {"RMSEpa", "RMSE", "MAEpa", "MAE"};
3676 }
3677 else if (property == "force")
3678 {
3679 tiny = "F";
3680 plural = "forces";
3681 errorMetrics = {"RMSE", "MAE"};
3682 }
3683 else if (property == "charge")
3684 {
3685 tiny = "Q";
3686 plural = "charges";
3687 errorMetrics = {"RMSE", "MAE"};
3688 }
3689 else
3690 {
3691 throw runtime_error("ERROR: Unknown training property.\n");
3692 }
3693
3694 // Set up error metrics
3695 for (auto m : errorMetrics)
3696 {
3697 errorTrain[m] = 0.0;
3698 errorTest[m] = 0.0;
3699 }
3701}
Collect and process large data sets.
Definition: Dataset.h:35
std::size_t numStructures
Total number of structures in dataset.
Definition: Dataset.h:203
gsl_rng * rng
GSL random number generator (different seed for each MPI process).
Definition: Dataset.h:209
MPI_Comm comm
Global MPI communicator.
Definition: Dataset.h:207
int numProcs
Total number of MPI processors.
Definition: Dataset.h:201
std::vector< Structure > structures
All structures in this dataset.
Definition: Dataset.h:195
void combineFiles(std::string filePrefix) const
Combine individual MPI proc files to one.
Definition: Dataset.cpp:1742
int myRank
My process ID.
Definition: Dataset.h:199
gsl_rng * rngGlobal
Global GSL random number generator (equal seed for each MPI process).
Definition: Dataset.h:211
void collectError(std::string const &property, std::map< std::string, double > &error, std::size_t &count) const
Collect error metrics of a property over all MPI procs.
Definition: Dataset.cpp:1710
std::size_t atomicNumber(std::size_t index) const
Get atomic number from element index.
Definition: ElementMap.h:145
Weight updates based on simple gradient descent methods.
void setParametersFixed(double const eta)
Set parameters for fixed step gradient descent algorithm.
void setParametersAdam(double const eta, double const beta1, double const beta2, double const epsilon)
Set parameters for Adam algorithm.
DescentType
Enumerate different gradient descent variants.
@ DT_ADAM
Adaptive moment estimation (Adam).
@ DT_FIXED
Fixed step size.
Implementation of the Kalman filter method.
Definition: KalmanFilter.h:32
void setParametersStandard(double const epsilon, double const q0, double const qtau, double const qmin, double const eta0, double const etatau, double const etamax)
Set parameters for standard Kalman filter.
void setParametersFadingMemory(double const epsilon, double const q0, double const qtau, double const qmin, double const lambda, double const nu)
Set parameters for fading memory Kalman filter.
KalmanType
Enumerate different Kalman filter types.
Definition: KalmanFilter.h:36
@ KT_STANDARD
Regular Kalman filter.
Definition: KalmanFilter.h:38
@ KT_FADINGMEMORY
Kalman filtering with fading memory modification.
Definition: KalmanFilter.h:40
void setSizeObservation(std::size_t const sizeObservation)
Set observation vector size.
bool silent
Completely silence output.
Definition: Log.h:87
bool normalize
Definition: Mode.h:514
double convEnergy
Definition: Mode.h:523
void setupNormalization(bool standalone=true)
Set up normalization.
Definition: Mode.cpp:218
ElementMap elementMap
Global element map, populated by setupElementMap().
Definition: Mode.h:508
NNPType nnpType
Definition: Mode.h:513
void addEnergyOffset(Structure &structure, bool ref=true)
Add atomic energy offsets to reference energy.
Definition: Mode.cpp:1461
double convLength
Definition: Mode.h:524
virtual void setupSymmetryFunctionCache(bool verbose=false)
Set up symmetry function cache.
Definition: Mode.cpp:804
double maxCutoffRadius
Definition: Mode.h:520
@ SHORT_CHARGE_NN
Short range NNP with additional charge NN (M. Bircher).
@ SHORT_ONLY
Short range NNP only.
void readNeuralNetworkWeights(std::string const &type, std::string const &fileName)
Read in weights for a specific type of neural network.
Definition: Mode.cpp:1699
double meanEnergy
Definition: Mode.h:522
double physical(std::string const &property, double value) const
Undo normalization for a given property.
Definition: Mode.cpp:1549
virtual void setupSymmetryFunctionGroups()
Set up symmetry function groups.
Definition: Mode.cpp:662
std::vector< Element > elements
Definition: Mode.h:528
std::size_t numElements
Definition: Mode.h:517
void calculateAtomicNeuralNetworks(Structure &structure, bool const derivatives)
Calculate a single atomic neural network for a given atom and nn type.
Definition: Mode.cpp:1310
void calculateEnergy(Structure &structure) const
Calculate potential energy for a given structure.
Definition: Mode.cpp:1366
void calculateSymmetryFunctionGroups(Structure &structure, bool const derivatives)
Calculate all symmetry function groups for all atoms in given structure.
Definition: Mode.cpp:1230
virtual void setupSymmetryFunctionScaling(std::string const &fileName="scaling.data")
Set up symmetry function scaling from file.
Definition: Mode.cpp:532
void removeEnergyOffset(Structure &structure, bool ref=true)
Remove atomic energy offsets from reference energy.
Definition: Mode.cpp:1480
Log log
Global log file.
Definition: Mode.h:510
double getEnergyWithOffset(Structure const &structure, bool ref=true) const
Add atomic energy offsets and return energy.
Definition: Mode.cpp:1512
Settings settings
Definition: Mode.h:525
virtual void setupSymmetryFunctions()
Set up all symmetry functions.
Definition: Mode.cpp:435
void calculateSymmetryFunctions(Structure &structure, bool const derivatives)
Calculate all symmetry functions for all atoms in given structure.
Definition: Mode.cpp:1150
void calculateForces(Structure &structure) const
Calculate forces for all atoms in given structure.
Definition: Mode.cpp:1392
void setupSymmetryFunctionStatistics(bool collectStatistics, bool collectExtrapolationWarnings, bool writeExtrapolationWarnings, bool stopOnExtrapolationWarnings)
Set up symmetry function statistics collection.
Definition: Mode.cpp:923
void setupSymmetryFunctionMemory(bool verbose=false)
Extract required memory dimensions for symmetry function derivatives.
Definition: Mode.cpp:714
void writeSettingsFile(std::ofstream *const &file) const
Write complete settings file.
Definition: Mode.cpp:1650
This class implements a feed-forward neural network.
Definition: NeuralNetwork.h:29
int getNumConnections() const
Return total number of connections.
void setInput(double const *const &input) const
Set neural network input layer node values.
void modifyConnections(ModificationScheme modificationScheme)
Change connections according to a given modification scheme.
void setConnections(double const *const &connections)
Set neural network weights and biases.
void calculateDFdc(double *dFdc, double const *const &dGdxyz) const
Calculate "second" derivative of output with respect to connections.
@ MS_ZEROBIAS
Set all bias values to zero.
Definition: NeuralNetwork.h:60
@ MS_GLOROTBENGIO
Normalize connections according to Glorot and Bengio.
Definition: NeuralNetwork.h:88
@ MS_NGUYENWIDROW
Initialize connections according to Nguyen-Widrow scheme.
void getConnections(double *connections) const
Get neural network weights and biases.
void propagate()
Propagate input information through all layers.
void calculateDEdc(double *dEdc) const
Calculate derivative of output neuron with respect to connections.
void calculateDEdG(double *dEdG) const
Calculate derivative of output neuron with respect to input neurons.
void getOutput(double *output) const
Get neural network output layer node values.
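
The members above combine into a simple forward pass. A sketch, assuming nn is an already constructed NeuralNetwork for one element and G holds that atom's scaled symmetry function values:

#include <vector>
#include "NeuralNetwork.h"

using namespace nnp;

// Sketch of one atomic NN evaluation: input -> propagate -> output.
double forwardPass(NeuralNetwork& nn, std::vector<double> const& G)
{
    nn.setInput(G.data()); // copy symmetry function values into input layer
    nn.propagate();        // feed-forward through all hidden layers
    double energy = 0.0;
    nn.getOutput(&energy); // single output neuron: atomic energy contribution
    return energy;
}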
void writeSettingsFile(std::ofstream *const &file, std::map< std::size_t, std::string > const &replacements={}) const
Write complete settings file.
Definition: Settings.cpp:274
bool keywordExists(std::string const &keyword, bool exact=false) const
Check if keyword is present in settings file.
Definition: Settings.cpp:177
std::vector< std::string > getSettingsLines() const
Get complete settings file.
Definition: Settings.cpp:244
void setTrainingLogFileName(std::string fileName)
Set training log file name.
Definition: Training.cpp:2842
UpdaterType updaterType
Updater type used.
Definition: Training.h:459
std::vector< double > dGdxia
Derivative of symmetry functions with respect to one specific atom coordinate.
Definition: Training.h:517
std::size_t epoch
Current epoch.
Definition: Training.h:485
std::vector< std::size_t > numWeightsPerUpdater
Number of weights per updater.
Definition: Training.h:509
std::size_t writeWeightsAlways
Up to this epoch weights are written every epoch.
Definition: Training.h:489
void randomizeNeuralNetworkWeights(std::string const &type)
Randomly initialize specific neural network weights.

Definition: Training.cpp:3176
std::size_t numWeights
Total number of weights.
Definition: Training.h:497
bool useForces
Use forces for training.
Definition: Training.h:471
std::size_t writeWeightsEvery
Write weights every this many epochs.
Definition: Training.h:487
void setupTraining()
General training settings and setup of weight update routine.
Definition: Training.cpp:703
std::mt19937_64 rngGlobalNew
Global random number generator.
Definition: Training.h:530
std::string nnId
ID of neural network the training is working on.
Definition: Training.h:503
void allocateArrays(std::string const &property)
Allocate error and Jacobian arrays for given property.
Definition: Training.cpp:3515
void writeWeightsEpoch() const
Write weights to files during training loop.
Definition: Training.cpp:1576
std::ofstream trainingLog
Training log file.
Definition: Training.h:505
bool hasUpdaters
If this rank performs weight updates.
Definition: Training.h:467
void checkSelectionMode()
Check if selection mode should be changed.
Definition: Training.cpp:1961
std::string trainingLogFileName
File name for training log.
Definition: Training.h:501
JacobianMode jacobianMode
Jacobian mode used.
Definition: Training.h:463
void selectSets()
Randomly select training and test set structures.
Definition: Training.cpp:81
JacobianMode
Jacobian matrix preparation mode.
Definition: Training.h:85
@ JM_SUM
No Jacobian, sum up contributions from update candidates.
Definition: Training.h:87
@ JM_TASK
Prepare one Jacobian entry for each task, sum up within tasks.
Definition: Training.h:89
@ JM_FULL
Prepare full Jacobian matrix.
Definition: Training.h:91
std::size_t countUpdates
Update counter (for all training quantities together).
Definition: Training.h:495
std::map< std::string, Stopwatch > sw
Stopwatches for timing overview.
Definition: Training.h:526
void setupSelectionMode(std::string const &property)
Set selection mode for specific training property.
Definition: Training.cpp:3235
void dPdc(std::string property, Structure &structure, std::vector< std::vector< double > > &dEdc)
Compute derivatives of property with respect to weights.
Definition: Training.cpp:2884
void printHeader()
Print training loop header on screen.
Definition: Training.cpp:1455
std::mt19937_64 rngNew
Per-task random number generator.
Definition: Training.h:528
PropertyMap p
Actual training properties.
Definition: Training.h:532
std::vector< Updater * > updaters
Weight updater (combined or for each element).
Definition: Training.h:523
std::size_t writeNeuronStatisticsAlways
Up to this epoch neuron statistics are written every epoch.
Definition: Training.h:493
UpdaterType
Type of update routine.
Definition: Training.h:40
@ UT_GD
Simple gradient descent methods.
Definition: Training.h:42
@ UT_KF
Kalman filter-based methods.
Definition: Training.h:44
@ UT_LM
Levenberg-Marquardt algorithm.
Definition: Training.h:46
double forceWeight
Force update weight.
Definition: Training.h:499
void update(std::string const &property)
Perform one update.
Definition: Training.cpp:2096
void dataSetNormalization()
Apply normalization based on initial weights prediction.
Definition: Training.cpp:398
ParallelMode
Training parallelization mode.
Definition: Training.h:56
@ PM_TRAIN_RK0
No training parallelization, only data set distribution.
Definition: Training.h:71
@ PM_TRAIN_ALL
Parallel gradient computation, update on each task.
Definition: Training.h:80
bool writeTrainingLog
Whether training log file is written.
Definition: Training.h:477
std::size_t numUpdaters
Number of updaters (depends on update strategy).
Definition: Training.h:481
bool advance() const
Check if training loop should be continued.
Definition: Training.cpp:3038
~Training()
Destructor, updater vector needs to be cleaned.
Definition: Training.cpp:63
void sortUpdateCandidates(std::string const &property)
Sort update candidates by descending RMSE.
Definition: Training.cpp:1892
void writeNeuronStatisticsEpoch() const
Write neuron statistics during training loop.
Definition: Training.cpp:1807
SelectionMode
How update candidates are selected during Training.
Definition: Training.h:105
@ SM_RANDOM
Select candidates randomly.
Definition: Training.h:107
@ SM_THRESHOLD
Select candidates randomly with RMSE above threshold.
Definition: Training.h:111
@ SM_SORT
Sort candidates according to their RMSE and pick worst first.
Definition: Training.h:109
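
A control-flow sketch of the SM_THRESHOLD mode: random candidates are drawn until one with an error above the threshold is found, or the trial budget is exhausted. Here candidateRmse is a hypothetical stand-in for the per-candidate errors n2p2 stores with its update candidates; the vector is assumed non-empty.

#include <cstddef>
#include <random>
#include <vector>

std::size_t selectThreshold(std::vector<double> const& candidateRmse,
                            double const rmseThreshold,
                            std::size_t const rmseThresholdTrials,
                            std::mt19937_64& rng)
{
    std::uniform_int_distribution<std::size_t> dist(0, candidateRmse.size() - 1);
    std::size_t chosen = dist(rng);
    for (std::size_t trial = 1; trial < rmseThresholdTrials
         && candidateRmse.at(chosen) <= rmseThreshold; ++trial)
    {
        chosen = dist(rng); // redraw while below the threshold
    }
    return chosen; // last draw wins if no candidate exceeded the threshold
}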
std::size_t stage
Training stage.
Definition: Training.h:479
void collectDGdxia(Atom const &atom, std::size_t indexAtom, std::size_t indexComponent)
Collect derivative of symmetry functions with respect to one atom's coordinate.

Definition: Training.cpp:3138
void setWeights()
Set weights in neural network class.
Definition: Training.cpp:3068
void loop()
Execute main training loop.
Definition: Training.cpp:1994
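
An abbreviated driver sketch using only Training members documented on this page. The ordering is one plausible sequence under that assumption; a real driver (cf. the nnp-train tool shipped with n2p2) performs additional Mode/Dataset setup (settings file, symmetry functions, structure distribution, MPI) first, and its source is the authoritative reference for the exact call order.

#include "Training.h"

using namespace nnp;

int main()
{
    Training training;
    // ... MPI, settings, symmetry function and data set setup omitted ...
    training.setStage(1);             // only relevant for multi-stage NNP types
    training.selectSets();            // random training/test split
    training.writeSetsToFiles();      // train.data / test.data
    training.setupTraining();         // updaters, weights, update plan
    training.initializeWeights();
    training.calculateNeighborLists();
    training.loop();                  // main epoch loop
    training.writeTimingData(false);  // timing.out
    return 0;
}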
void printEpoch()
Print preferred error metric and timing information on screen.
Definition: Training.cpp:1513
std::vector< std::size_t > weightsOffset
Offset of each element's weights in combined array.
Definition: Training.h:511
std::size_t numEpochs
Number of epochs requested.
Definition: Training.h:483
void setupFileOutput(std::string const &type)
Set file output intervals for properties and other quantities.
Definition: Training.cpp:3343
std::size_t getNumConnections(std::string id="short") const
Get total number of NN connections.
Definition: Training.cpp:2849
void addTrainingLogEntry(int proc, std::size_t il, double f, std::size_t isg, std::size_t is)
Write energy update data to training log file.
Definition: Training.cpp:3093
void writeTimingData(bool append, std::string const fileName="timing.out")
Write timing data for all clocks.
Definition: Training.cpp:3553
std::size_t writeNeuronStatisticsEvery
Write neuron statistics every this many epochs.
Definition: Training.h:491
void getWeights()
Get weights from neural network class.
Definition: Training.cpp:3044
void dPdcN(std::string property, Structure &structure, std::vector< std::vector< double > > &dEdc, double delta=1.0E-4)
Compute numeric derivatives of property with respect to weights.
Definition: Training.cpp:2956
std::vector< std::string > setupNumericDerivCheck()
Set up numeric weight derivatives check.
Definition: Training.cpp:1170
void setSingleWeight(std::size_t element, std::size_t index, double value)
Set a single weight value.
Definition: Training.cpp:2744
void shuffleUpdateCandidates(std::string const &property)
Shuffle update candidates.
Definition: Training.cpp:1922
double getSingleWeight(std::size_t element, std::size_t index)
Get a single weight value.
Definition: Training.cpp:2737
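
getSingleWeight()/setSingleWeight() make a manual central-difference check easy. A fragment, written as if inside a Training member function and mirroring what dPdcN() does internally; el, idx and the Structure s (with symmetry functions already computed) are assumptions of this example.

// Central-difference estimate of dE/dc for weight (el, idx).
double const delta = 1.0E-4;
double const c0 = getSingleWeight(el, idx);

setSingleWeight(el, idx, c0 + delta);
calculateAtomicNeuralNetworks(s, false);
calculateEnergy(s);
double const ePlus = s.energy;

setSingleWeight(el, idx, c0 - delta);
calculateAtomicNeuralNetworks(s, false);
calculateEnergy(s);
double const eMinus = s.energy;

setSingleWeight(el, idx, c0); // restore the original weight
double const dEdc = (ePlus - eMinus) / (2.0 * delta);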
void initializeWeights()
Initialize weights for all elements.
Definition: Training.cpp:259
void initializeWeightsMemory(UpdateStrategy updateStrategy=US_COMBINED)
Initialize weights vector according to update strategy.
Definition: Training.cpp:314
bool repeatedEnergyUpdates
After force update perform energy update for corresponding structure.
Definition: Training.h:473
UpdateStrategy updateStrategy
Update strategy used.
Definition: Training.h:465
void calculateNeighborLists()
Calculate neighbor lists for all structures.
Definition: Training.cpp:1206
ParallelMode parallelMode
Parallelization mode used.
Definition: Training.h:461
void writeNeuronStatistics(std::string const &nnName, std::string const &fileName) const
Write neuron statistics collected since last invocation.
Definition: Training.cpp:1708
std::vector< std::size_t > getConnectionOffsets(std::string id="short") const
Get offsets of NN connections for each element.
Definition: Training.cpp:2871
std::vector< int > epochSchedule
Update schedule for one epoch (false = energy update, true = force update).
Definition: Training.h:507
void writeUpdaterStatus(bool append, std::string const fileNameFormat="updater.%03zu.out") const
Write updater information to file.
Definition: Training.cpp:1857
UpdateStrategy
Update strategies available for Training.
Definition: Training.h:96
@ US_COMBINED
One combined updater for all elements.
Definition: Training.h:98
@ US_ELEMENT
Separate updaters for individual elements.
Definition: Training.h:100
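
The update strategy fixes how many updaters exist and how the weight arrays are partitioned. A two-line fragment, written as if inside Training setup code:

initializeWeightsMemory(US_COMBINED); // numUpdaters == 1: all elements' weights
                                      // concatenated, per-element offsets kept
                                      // in weightsOffset
initializeWeightsMemory(US_ELEMENT);  // numUpdaters == numElements: one
                                      // independent weight block per element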
std::vector< std::size_t > getNumConnectionsPerElement(std::string id="short") const
Get number of NN connections for each element.
Definition: Training.cpp:2860
void resetNeuronStatistics()
Reset neuron statistics for all elements.
Definition: Training.cpp:1847
std::vector< std::vector< double > > calculateWeightDerivatives(Structure *structure)
Calculate derivatives of energy with respect to weights.
Definition: Training.cpp:2753
void calculateError(std::map< std::string, std::pair< std::string, std::string > > const fileNames)
Calculate error metrics for all structures.
Definition: Training.cpp:1246
void writeLearningCurve(bool append, std::string const fileName="learning-curve.out") const
Write current RMSEs and epoch information to file.
Definition: Training.cpp:1595
void calculateErrorEpoch()
Calculate per-epoch error metrics for all structures, using the file names from the training loop.
Definition: Training.cpp:1425
std::vector< std::string > pk
Vector of actually used training properties.
Definition: Training.h:513
void setEpochSchedule()
Select energies/forces schedule for one epoch.
Definition: Training.cpp:1933
bool hasStructures
If this rank holds structure information.
Definition: Training.h:469
std::vector< std::vector< double > > weights
Neural network weights and biases for each element.
Definition: Training.h:521
bool freeMemory
Free symmetry function memory after calculation.
Definition: Training.h:475
void writeSetsToFiles()
Write training and test set to separate files (train.data and test.data, same format as input.data).
Definition: Training.cpp:197
void writeWeights(std::string const &nnName, std::string const &fileNameFormat) const
Write weights to files (one file for each element).
Definition: Training.cpp:1559
void setStage(std::size_t stage)
Set training stage (if multiple stages are needed for NNP type).
Definition: Training.cpp:361
void setupUpdatePlan(std::string const &property)
Set up how often properties are updated.
Definition: Training.cpp:3405
Base class for different weight update methods.
Definition: Updater.h:32
#define MPI_SIZE_T
Definition: mpi-extra.h:22
Definition: Atom.h:28
string strpr(const char *format,...)
String version of printf function.
Definition: utility.cpp:90
vector< string > createFileHeader(vector< string > const &title, vector< size_t > const &colSize, vector< string > const &colName, vector< string > const &colInfo, char const &commentChar)
Definition: utility.cpp:104
vector< string > split(string const &input, char delimiter)
Split string at each delimiter.
Definition: utility.cpp:33
string reduce(string const &line, string const &whitespace, string const &fill)
Replace multiple whitespaces with fill.
Definition: utility.cpp:60
void appendLinesToFile(ofstream &file, vector< string > const lines)
Append multiple lines of strings to open file stream.
Definition: utility.cpp:218
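
A short usage sketch for the string helpers above, combining reduce(), split() and strpr() in the way n2p2's parsing code typically chains them; the sample input line is an assumption.

#include <string>
#include <vector>
#include "utility.h"

using namespace std;
using namespace nnp;

int main()
{
    string line = "  1.0   2.0\t3.0 ";
    // Collapse runs of whitespace/tabs to single spaces.
    string clean = reduce(line, " \t", " ");
    // Tokenize at spaces.
    vector<string> cols = split(clean, ' ');
    // printf-style formatting into a std::string.
    string msg = strpr("read %zu columns\n", cols.size());
    return 0;
}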
double d
Definition: nnp-cutoff.cpp:34
Struct to store information on neighbor atoms.
Definition: Atom.h:35
std::size_t element
Element index of neighbor atom.
Definition: Atom.h:41
std::vector< Vec3D > dGdr
Derivatives of symmetry functions with respect to neighbor coordinates.
Definition: Atom.h:59
Storage for a single atom.
Definition: Atom.h:32
std::vector< Neighbor > neighbors
Neighbor array (maximum number defined in macros.h).

Definition: Atom.h:148
std::size_t numSymmetryFunctions
Number of symmetry functions used to describe the atom environment.
Definition: Atom.h:110
Vec3D f
Force vector calculated by neural network.
Definition: Atom.h:120
double charge
Atomic charge determined by neural network.
Definition: Atom.h:114
std::size_t index
Index number of this atom.
Definition: Atom.h:98
Vec3D fRef
Reference force vector from data set.
Definition: Atom.h:122
std::vector< Vec3D > dGdr
Derivative of symmetry functions with respect to this atom's coordinates.
Definition: Atom.h:146
std::size_t element
Element index of this atom.
Definition: Atom.h:104
std::vector< double > G
Symmetry function values.
Definition: Atom.h:134
double chargeRef
Atomic reference charge.
Definition: Atom.h:116
std::vector< std::size_t > numNeighborsPerElement
Number of neighbors per element.
Definition: Atom.h:126
std::size_t numNeighbors
Total number of neighbors.
Definition: Atom.h:106
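
The paired members f and fRef support per-atom force error accumulation. A sketch, assuming Vec3D provides const component access via operator[]:

#include <cstddef>
#include "Atom.h"

using namespace nnp;

// Squared force error of one atom: NN force (f) vs. reference force (fRef).
double squaredForceError(Atom const& atom)
{
    double se = 0.0;
    for (std::size_t c = 0; c < 3; ++c)
    {
        double const diff = atom.fRef[c] - atom.f[c];
        se += diff * diff;
    }
    return se;
}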
Storage for one atomic configuration.
Definition: Structure.h:34
@ ST_TRAINING
Structure is part of the training set.
Definition: Structure.h:44
@ ST_UNKNOWN
Sample type not assigned yet.
Definition: Structure.h:41
@ ST_TEST
Structure is part of the test set.
Definition: Structure.h:50
std::vector< std::size_t > numAtomsPerElement
Number of atoms of each element in this structure.
Definition: Structure.h:94
std::size_t index
Index number of this structure.
Definition: Structure.h:66
SampleType sampleType
Sample type (training or test set).
Definition: Structure.h:86
void freeAtoms(bool all)
Free symmetry function memory for all atoms, see free() in Atom class.
Definition: Structure.cpp:531
double energy
Potential energy determined by neural network.
Definition: Structure.h:76
double energyRef
Reference potential energy.
Definition: Structure.h:78
std::size_t numAtoms
Total number of atoms present in this structure.
Definition: Structure.h:68
std::vector< Atom > atoms
Vector of all atoms in this structure.
Definition: Structure.h:96
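
Since Training::selectSets() stamps each structure with a SampleType, the resulting split can be recovered by a simple scan; a minimal sketch:

#include <cstddef>
#include <vector>
#include "Structure.h"

using namespace nnp;

// Count the training/test split produced by Training::selectSets().
void countSplit(std::vector<Structure> const& structures,
                std::size_t& nTrain, std::size_t& nTest)
{
    nTrain = 0;
    nTest  = 0;
    for (Structure const& s : structures)
    {
        if      (s.sampleType == Structure::ST_TRAINING) nTrain++;
        else if (s.sampleType == Structure::ST_TEST)     nTest++;
    }
}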
bool exists(std::string const &key)
Check if property is present.
Definition: Training.h:452
Specific training quantity (e.g. energies, forces, charges).
Definition: Training.h:368
std::size_t numErrorsGlobal
Global number of errors per update.
Definition: Training.h:405
std::size_t numTrainPatterns
Number of training patterns in set.
Definition: Training.h:383
std::vector< int > errorsPerTask
Errors per task for each update.
Definition: Training.h:411
std::string property
Copy of identifier within Property map.
Definition: Training.h:373
SelectionMode selectionMode
Selection mode for update candidates.
Definition: Training.h:381
std::size_t numUpdates
Number of desired updates per epoch.
Definition: Training.h:399
double rmseThreshold
RMSE threshold for update candidates.
Definition: Training.h:409
std::string plural
Plural string of property.
Definition: Training.h:379
double epochFraction
Desired update fraction per epoch.
Definition: Training.h:407
std::size_t patternsPerUpdate
Patterns used per update.
Definition: Training.h:401
std::size_t taskBatchSize
Batch size for each MPI task.
Definition: Training.h:387
std::vector< std::vector< double > > error
Global error vector (per updater).
Definition: Training.h:432
std::string displayMetric
Error metric for display.
Definition: Training.h:375
std::string tiny
Tiny abbreviation string for property.
Definition: Training.h:377
std::vector< std::string > errorMetrics
Error metrics available for this property.
Definition: Training.h:415
Property(std::string const &property)
Constructor.
Definition: Training.cpp:3650
std::vector< std::vector< int > > offsetJacobian
Stride for Jacobians per task per updater.
Definition: Training.h:429
std::size_t countUpdates
Counter for updates per epoch.
Definition: Training.h:397
std::vector< std::vector< int > > weightsPerTask
Weights per task per updater.
Definition: Training.h:426
std::vector< int > offsetPerTask
Offset for combined error per task.
Definition: Training.h:413
std::vector< UpdateCandidate > updateCandidates
Vector with indices of training patterns.
Definition: Training.h:423
std::map< std::string, double > errorTrain
Current error metrics of training patterns.
Definition: Training.h:418
std::vector< std::vector< double > > jacobian
Global Jacobian (per updater).
Definition: Training.h:435
std::size_t patternsPerUpdateGlobal
Patterns used per update (summed over all MPI tasks).
Definition: Training.h:403
std::map< std::string, double > errorTest
Current error metrics of test patterns.
Definition: Training.h:421
std::size_t rmseThresholdTrials
Maximum trials for SM_THRESHOLD selection mode.
Definition: Training.h:395
std::size_t posUpdateCandidates
Current position in update candidate list (SM_SORT).
Definition: Training.h:393
Contains location of one update candidate (energy or force).
Definition: Training.h:350
std::size_t a
Atom index (only used for force candidates).
Definition: Training.h:354
std::size_t c
Component index (x,y,z -> 0,1,2, only used for force candidates).
Definition: Training.h:356
std::size_t s
Structure index.
Definition: Training.h:352
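
The three indices above locate a candidate inside the data set. A fragment, written as if inside a Training member function (so that structures, p and UpdateCandidate are in scope); for an energy candidate only s is meaningful, while force candidates additionally use a and c.

// Resolve the first force update candidate to its reference data.
UpdateCandidate const& uc = p["force"].updateCandidates.at(0);
Structure const& s = structures.at(uc.s); // Dataset::structures
Atom const& a = s.atoms.at(uc.a);         // atom uc.a within that structure
double const fRef = a.fRef[uc.c];         // component uc.c (0=x, 1=y, 2=z)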