n2p2 - A neural network potential package
Loading...
Searching...
No Matches
Settings.cpp
Go to the documentation of this file.
1// n2p2 - A neural network potential package
2// Copyright (C) 2018 Andreas Singraber (University of Vienna)
3//
4// This program is free software: you can redistribute it and/or modify
5// it under the terms of the GNU General Public License as published by
6// the Free Software Foundation, either version 3 of the License, or
7// (at your option) any later version.
8//
9// This program is distributed in the hope that it will be useful,
10// but WITHOUT ANY WARRANTY; without even the implied warranty of
11// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12// GNU General Public License for more details.
13//
14// You should have received a copy of the GNU General Public License
15// along with this program. If not, see <https://www.gnu.org/licenses/>.
16
17#include "Settings.h"
18#include "utility.h"
19#include <fstream> // std::ifstream
20#include <stdexcept> // std::runtime_error
21#include <tuple> // std::tie
22
23using namespace std;
24using namespace nnp;
25using namespace settings;
26
27map<string, shared_ptr<settings::Key>> const createKnownKeywordsMap()
28{
29 // Main keyword names and descriptions.
30 map<string, string> m;
31 // Alternative names.
32 map<string, vector<string>> a;
33 // Complete keyword map to return.
34 map<string, shared_ptr<settings::Key>> r;
35
36 // Required for prediction.
37 m["number_of_elements" ] = "";
38 m["elements" ] = "";
39 m["atom_energy" ] = "";
40 m["cutoff_type" ] = "";
41 m["symfunction_short" ] = "";
42 m["scale_symmetry_functions" ] = "";
43 m["scale_min_short" ] = "";
44 m["scale_max_short" ] = "";
45 m["center_symmetry_functions" ] = "";
46 m["scale_symmetry_functions_sigma" ] = "";
47 m["global_hidden_layers_short" ] = "";
48 m["global_hidden_layers_electrostatic" ] = "";
49 m["global_nodes_short" ] = "";
50 m["global_nodes_electrostatic" ] = "";
51 m["global_activation_short" ] = "";
52 m["global_activation_electrostatic" ] = "";
53 m["element_hidden_layers_short" ] = "";
54 m["element_hidden_layers_electrostatic"] = "";
55 m["element_nodes_short" ] = "";
56 m["element_nodes_electrostatic" ] = "";
57 m["element_activation_short" ] = "";
58 m["element_activation_electrostatic" ] = "";
59 m["normalize_nodes" ] = "";
60 m["mean_energy" ] = "";
61 m["conv_length" ] = "";
62 m["conv_energy" ] = "";
63 m["conv_charge" ] = "";
64 m["nnp_type" ] = "";
65 m["fixed_gausswidth" ] = "";
66 m["ewald_truncation_error_method" ] = "";
67 m["kspace_solver" ] = "";
68 m["ewald_prec" ] = "";
69 m["screen_electrostatics" ] = "";
70 m["four_pi_epsilon" ] = "";
71
72 // Training keywords.
73 m["random_seed" ] = "";
74 m["test_fraction" ] = "";
75 m["epochs" ] = "";
76 m["normalize_data_set" ] = "";
77 m["use_short_forces" ] = "";
78 m["rmse_threshold" ] = "";
79 m["rmse_threshold_energy" ] = "";
80 m["rmse_threshold_force" ] = "";
81 m["rmse_threshold_charge" ] = "";
82 m["rmse_threshold_trials" ] = "";
83 m["rmse_threshold_trials_energy" ] = "";
84 m["rmse_threshold_trials_force" ] = "";
85 m["rmse_threshold_trials_charge" ] = "";
86 m["energy_fraction" ] = "";
87 m["force_fraction" ] = "";
88 m["force_energy_ratio" ] = "";
89 m["charge_fraction" ] = "";
90 m["use_old_weights_short" ] = "";
91 m["use_old_weights_charge" ] = "";
92 m["weights_min" ] = "";
93 m["weights_max" ] = "";
94 m["initial_hardness" ] = "";
95 m["nguyen_widrow_weights_short" ] = "";
96 m["nguyen_widrow_weights_charge" ] = "";
97 m["precondition_weights" ] = "";
98 m["main_error_metric" ] = "";
99 m["write_trainpoints" ] = "";
100 m["write_trainforces" ] = "";
101 m["write_traincharges" ] = "";
102 m["write_weights_epoch" ] = "";
103 m["write_neuronstats" ] = "";
104 m["write_trainlog" ] = "";
105 m["repeated_energy_update" ] = "";
106 m["updater_type" ] = "";
107 m["parallel_mode" ] = "";
108 m["jacobian_mode" ] = "";
109 m["update_strategy" ] = "";
110 m["selection_mode" ] = "";
111 m["selection_mode_energy" ] = "";
112 m["selection_mode_force" ] = "";
113 m["selection_mode_charge" ] = "";
114 m["task_batch_size_energy" ] = "";
115 m["task_batch_size_force" ] = "";
116 m["task_batch_size_charge" ] = "";
117 m["gradient_type" ] = "";
118 m["gradient_eta" ] = "";
119 m["gradient_adam_eta" ] = "";
120 m["gradient_adam_beta1" ] = "";
121 m["gradient_adam_beta2" ] = "";
122 m["gradient_adam_epsilon" ] = "";
123 m["kalman_type" ] = "";
124 m["kalman_epsilon" ] = "";
125 m["kalman_eta" ] = "";
126 m["kalman_etatau" ] = "";
127 m["kalman_etamax" ] = "";
128 m["kalman_q0" ] = "";
129 m["kalman_qtau" ] = "";
130 m["kalman_qmin" ] = "";
131 m["kalman_lambda_short" ] = "";
132 m["kalman_nue_short" ] = "";
133 m["memorize_symfunc_results" ] = "";
134 m["force_weight" ] = "";
135
136 // Alternative keyword names.
137 a["nnp_type" ] = {"nnp_generation", "nnp_type_gen", "nnp_gen"};
138 a["rmse_threshold_energy"] = {"short_energy_error_threshold"};
139 a["rmse_threshold_force" ] = {"short_force_error_threshold"};
140 a["energy_fraction" ] = {"short_energy_fraction"};
141 a["force_fraction" ] = {"short_force_fraction"};
142 a["symfunction_short" ] = {"symfunction"};
143
144 for (auto im : m)
145 {
146 // Check if keyword was already inserted.
147 if (r.find(im.first) != r.end())
148 {
149 throw runtime_error("ERROR: Multiple definition of keyword.\n");
150 }
151 // Insert new shared pointer to a Key object.
152 r[im.first] = make_shared<settings::Key>();
153 // Add main keyword as first entry in alternatives list.
154 r.at(im.first)->addAlternative(im.first);
155 // Add description text.
156 r.at(im.first)->setDescription(im.second);
157 // Check if alternative keywords exist.
158 if (a.find(im.first) != a.end())
159 {
160 // Loop over all alternative keywords.
161 for (auto alt : a.at(im.first))
162 {
163 // Check if alternative keyword is already inserted.
164 if (r.find(alt) != r.end())
165 {
166 throw runtime_error("ERROR: Multiple definition of "
167 "alternative keyword.\n");
168 }
169 // Set map entry, i.e. shared pointer, to Key object.
170 r[alt] = r.at(im.first);
171 // Add alternative keyword to list.
172 r[alt]->addAlternative(alt);
173 }
174 }
175 }
176
177 return r;
178}
179
181
182string Settings::operator[](string const& keyword) const
183{
184 return getValue(keyword);
185}
186
187
188size_t Settings::loadFile(string const& fileName)
189{
190 this->fileName = fileName;
191
192 readFile();
193 return parseLines();
194}
196 bool const exact) const
197{
198 return keywordExists(key.getMainKeyword(), exact);
199}
200bool Settings::keywordExists(string const& keyword, bool exact) const
201{
202 if (knownKeywords.find(keyword) == knownKeywords.end())
203 {
204 throw runtime_error("ERROR: Not in the list of allowed keyword: \"" +
205 keyword + "\".\n");
206 }
207 if (exact || knownKeywords.at(keyword)->hasUniqueKeyword())
208 {
209 return (contents.find(keyword) != contents.end());
210 }
211 else
212 {
213 for (auto alternative : *knownKeywords.at(keyword))
214 {
215 if (contents.find(alternative) != contents.end()) return true;
216 }
217 }
218
219 return false;
220}
221
222string Settings::keywordCheck(string const& keyword) const
223{
224 bool exists = keywordExists(keyword, false);
225 bool unique = knownKeywords.at(keyword)->hasUniqueKeyword();
226 if (!exists)
227 {
228 if (unique)
229 {
230 throw std::runtime_error("ERROR: Keyword \"" + keyword
231 + "\" not found.\n");
232 }
233 else
234 {
235 throw std::runtime_error("ERROR: Neither keyword \"" + keyword
236 + "\" nor alternative keywords found.\n");
237 }
238 }
239
240 bool exact = keywordExists(keyword, true);
241 if (!exact)
242 {
243 for (auto const& alt : *knownKeywords.at(keyword))
244 {
245 if (contents.find(alt) != contents.end()) return alt;
246 }
247 }
248
249 return keyword;
250}
251
252string Settings::getValue(Key const& key) const
253{
254 return contents.find(key.getMainKeyword())->second.first;
255}
256
257string Settings::getValue(string const& keyword) const
258{
259 return contents.find(keywordCheck(keyword))->second.first;
260}
261
262Settings::KeyRange Settings::getValues(string const& keyword) const
263{
264 return contents.equal_range(keywordCheck(keyword));
265}
266
267vector<string> Settings::info() const
268{
269 return log;
270}
271
272vector<string> Settings::getSettingsLines() const
273{
274 return lines;
275}
276
278{
279 ifstream file;
280 string line;
281
282 log.push_back(strpr("Settings file name: %s\n", fileName.c_str()));
283 file.open(fileName.c_str());
284 if (!file.is_open())
285 {
286 throw runtime_error("ERROR: Could not open file: \"" + fileName
287 + "\".\n");
288 }
289
290 while (getline(file, line))
291 {
292 lines.push_back(line);
293 }
294
295 file.close();
296
297 log.push_back(strpr("Read %zu lines.\n", lines.size()));
298
299 return;
300}
301
302void Settings::writeSettingsFile(ofstream* const& file,
303 map<size_t, string> const& replacements) const
304{
305 if (!file->is_open())
306 {
307 runtime_error("ERROR: Could not write to file.\n");
308 }
309
310 size_t i = 0;
311 for (auto const& l : lines)
312 {
313 if (replacements.find(i) != replacements.end())
314 {
315 (*file) << replacements.at(i);
316 }
317 else (*file) << l << '\n';
318 i++;
319 }
320
321 return;
322}
323
325{
326 for (size_t i = 0; i < lines.size(); ++i)
327 {
328 string line = lines.at(i);
329
330 // ignore empty and comment lines
331 if (line.empty())
332 {
333 continue;
334 }
335 // check for empty lines in Windows format
336 if (line == "\r")
337 {
338 continue;
339 }
340 if (line.find('#') != string::npos)
341 {
342 line.erase(line.find('#'));
343 }
344 if (line.find('!') != string::npos)
345 {
346 line.erase(line.find('!'));
347 }
348 if (line.find_first_not_of(' ') == string::npos)
349 {
350 continue;
351 }
352
353 // remove leading and trailing whitespaces and trim separating spaces
354 line = reduce(line);
355
356 // find separator position
357 size_t const separatorPosition = line.find_first_of(" ");
358 string key;
359 pair<string, size_t> value;
360
361 if (separatorPosition == string::npos)
362 {
363 // first check for single keyword without value
364 key = line;
365 value = pair<string, size_t>("", i);
366 }
367 else
368 {
369 // one or more arguments
370 key = line.substr(0, separatorPosition);
371 value = pair<string, size_t>(line.erase(0, separatorPosition + 1),
372 i);
373 }
374
375 contents.insert(pair<string, pair<string, size_t> >(key, value));
376 }
377
378 size_t numProblems = 0;
379 size_t numCritical = 0;
380 tie(numProblems, numCritical) = sanityCheck();
381 if (numProblems > 0)
382 {
383 log.push_back(strpr("WARNING: %zu problems detected (%zu critical).\n",
384 numProblems, numCritical));
385 }
386
387 log.push_back(strpr("Found %zu lines with keywords.\n", contents.size()));
388
389 return numCritical;
390}
391
392pair<size_t, size_t> Settings::sanityCheck()
393{
394 size_t countProblems = 0;
395 size_t countCritical = 0;
396
397 // check for unknown keywords
398 for (multimap<string, pair<string, size_t> >::const_iterator
399 it = contents.begin(); it != contents.end(); ++it)
400 {
401 if (knownKeywords.find((*it).first) == knownKeywords.end())
402 {
403 countProblems++;
404 log.push_back(strpr(
405 "WARNING: Unknown keyword \"%s\" at line %zu.\n",
406 (*it).first.c_str(),
407 (*it).second.second + 1));
408 }
409 }
410
411 // check for multiple instances of known keywords (with exceptions)
412 for (KeywordList::const_iterator it = knownKeywords.begin();
413 it != knownKeywords.end(); ++it)
414 {
415 if (contents.count((*it).first) > 1
416 && (*it).first != "symfunction"
417 && (*it).first != "symfunction_short"
418 && (*it).first != "atom_energy"
419 && (*it).first != "element_nodes_short"
420 && (*it).first != "fixed_gausswidth"
421 && (*it).first != "initial_hardness")
422 {
423 countProblems++;
424 countCritical++;
425 log.push_back(strpr(
426 "WARNING (CRITICAL): Multiple instances of \"%s\" detected.\n",
427 (*it).first.c_str()));
428 }
429 }
430
431 // Check for usage of multiple keyword versions.
432 for (KeywordList::const_iterator it = knownKeywords.begin();
433 it != knownKeywords.end(); ++it)
434 {
435 if (it->second->hasUniqueKeyword()) continue;
436 vector<string> duplicates;
437 for (auto keyword : *it->second)
438 {
439 if (contents.find(keyword) != contents.end())
440 {
441 duplicates.push_back(keyword);
442 }
443 }
444 if (duplicates.size() > 1)
445 {
446 countProblems++;
447 countCritical++;
448 log.push_back(strpr(
449 "WARNING (CRITICAL): Multiple alternative versions of keyword "
450 "\"%s\" detected:.\n", (*it).first.c_str()));
451 for (auto d : duplicates)
452 {
453 log.push_back(strpr(
454 " - \"%s\"\n", d.c_str()));
455 }
456 }
457 }
458
459 return make_pair(countProblems, countCritical);
460}
map< string, shared_ptr< settings::Key > > const createKnownKeywordsMap()
Definition Settings.cpp:27
Keyword properties.
Definition Key.h:18
std::string getMainKeyword() const
Definition Key.h:20
std::vector< std::string > info() const
Get logged information about settings file.
Definition Settings.cpp:267
std::string keywordCheck(std::string const &keyword) const
Check for keyword and alternatives, throw exception if not present.
Definition Settings.cpp:222
static KeywordList knownKeywords
Map containing all known keywords and a description.
Definition Settings.h:149
std::vector< std::string > lines
Vector of all lines in settings file.
Definition Settings.h:143
std::string getValue(Key const &key) const override
Definition Settings.cpp:252
void writeSettingsFile(std::ofstream *const &file, std::map< std::size_t, std::string > const &replacements={}) const
Write complete settings file.
Definition Settings.cpp:302
std::pair< KeyMap::const_iterator, KeyMap::const_iterator > KeyRange
Definition Settings.h:44
std::size_t loadFile(std::string const &fileName="input.nn")
Load a file with settings.
Definition Settings.cpp:188
std::map< std::string, std::shared_ptr< Key > > const KeywordList
Definition Settings.h:46
KeyRange getValues(std::string const &keyword) const
Get all keyword-value pairs for given keyword.
Definition Settings.cpp:262
std::vector< std::string > log
Vector with log lines.
Definition Settings.h:145
std::string fileName
Settings file name.
Definition Settings.h:151
KeyMap contents
Map containing all keyword-value pairs.
Definition Settings.h:147
std::vector< std::string > getSettingsLines() const
Get complete settings file.
Definition Settings.cpp:272
bool keywordExists(Key const &key, bool const exact=false) const override
Definition Settings.cpp:195
std::size_t parseLines()
Parse lines and create contents map.
Definition Settings.cpp:324
void readFile()
Read file once and save all lines in lines vector.
Definition Settings.cpp:277
std::pair< std::size_t, std::size_t > sanityCheck()
Check if all keywords are in known-keywords database and for duplicates.
Definition Settings.cpp:392
std::string operator[](std::string const &keyword) const
Overload [] operator.
Definition Settings.cpp:182
Definition Atom.h:29
string strpr(const char *format,...)
String version of printf function.
Definition utility.cpp:90
string reduce(string const &line, string const &whitespace, string const &fill)
Replace multiple whitespaces with fill.
Definition utility.cpp:60
double d