Merge branch 'pod' of https://github.com/cesmix-mit/lammps into pod

2022-10-12 21:24:46 -04:00
parent 5fbedfb492 2c9396fb25
commit 440724f73a
4 changed files with 1328 additions and 2425 deletions
--- a/src/ML-POD/compute_podfit.cpp
+++ b/src/ML-POD/compute_podfit.cpp
@ -35,8 +35,6 @@
 #define _USE_MATH_DEFINES
 #include <math.h>

-using std::cout;
-using std::endl;
 using std::string;
 using std::ios;
 using std::ofstream;
@ -278,23 +276,23 @@ void CPODFIT::read_data_file(double *fitting_weights, std::string &file_format,
  }    
  file_in.close();
  
-  std::cout<<"**************** Begin of Data File ****************"<<std::endl;
-  std::cout<<"file format: "<<file_format<<std::endl;
-  std::cout<<"file extension: "<<file_extension<<std::endl;
-  std::cout<<"path to training data set: "<<training_path<<std::endl;
-  std::cout<<"path to test data set: "<<test_path<<std::endl;  
-  std::cout<<"training percentage: "<<fitting_weights[7]<<std::endl;
-  std::cout<<"test percentage: "<<fitting_weights[8]<<std::endl;
-  std::cout<<"randomize training data set: "<<fitting_weights[9]<<std::endl;
-  std::cout<<"randomize test data set: "<<fitting_weights[10]<<std::endl;
-  std::cout<<"error analysis for training data set: "<<fitting_weights[3]<<std::endl;
-  std::cout<<"error analysis for test data set: "<<fitting_weights[4]<<std::endl;
-  std::cout<<"energy/force calculation for training data set: "<<fitting_weights[5]<<std::endl;
-  std::cout<<"energy/force calculation for test data set: "<<fitting_weights[6]<<std::endl;
-  std::cout<<"fitting weight for energy: "<<fitting_weights[0]<<std::endl;
-  std::cout<<"fitting weight for force: "<<fitting_weights[1]<<std::endl;
-  std::cout<<"fitting weight for stress: "<<fitting_weights[2]<<std::endl;  
-  std::cout<<"**************** End of Data File ****************"<<std::endl<<std::endl;
+  utils::logmesg(lmp, "**************** Begin of Data File ****************\n");
+  utils::logmesg(lmp, "file format: {}\n", file_format);
+  utils::logmesg(lmp, "file extension: {}\n", file_extension);
+  utils::logmesg(lmp, "path to training data set: {}\n", training_path);
+  utils::logmesg(lmp, "path to test data set: {}\n", test_path);
+  utils::logmesg(lmp, "training percentage: {}\n", fitting_weights[7]);
+  utils::logmesg(lmp, "test percentage: {}\n", fitting_weights[8]);
+  utils::logmesg(lmp, "randomize training data set: {}\n", fitting_weights[9]);
+  utils::logmesg(lmp, "randomize test data set: {}\n", fitting_weights[10]);
+  utils::logmesg(lmp, "error analysis for training data set: {}\n", fitting_weights[3]);
+  utils::logmesg(lmp, "error analysis for test data set: {}\n", fitting_weights[4]);
+  utils::logmesg(lmp, "energy/force calculation for training data set: {}\n", fitting_weights[5]);
+  utils::logmesg(lmp, "energy/force calculation for test data set: {}\n", fitting_weights[6]);
+  utils::logmesg(lmp, "fitting weight for energy: {}\n", fitting_weights[0]);
+  utils::logmesg(lmp, "fitting weight for force: {}\n", fitting_weights[1]);
+  utils::logmesg(lmp, "fitting weight for stress: {}\n", fitting_weights[2]);
+  utils::logmesg(lmp, "**************** End of Data File ****************\n");
 }

 std::vector<std::string> CPODFIT::globVector(const std::string& pattern, std::vector<std::string> & files)
@ -437,16 +435,15 @@ void CPODFIT::get_data(datastruct &data, std::vector<std::string> species)
  data.num_atom_sum = this->get_number_atoms(data.num_atom, data.num_atom_each_file, data.num_config, data.data_files);      
  data.num_config_sum = data.num_atom.size();
  
-  std::cout<<"data file   |  number of configurations   |   number of atoms "<<std::endl;
+  utils::logmesg(lmp, "data file   |  number of configurations   |   number of atoms\n");
  for (int i=0; i< (int) data.data_files.size(); i++) {
    string filename = data.data_files[i].substr(data.data_path.size()+1,data.data_files[i].size());
-    data.filenames.push_back(filename.c_str());                    
-    std::cout<<data.filenames[i]<<"   |   "<<data.num_config[i]<<"   |   "<<data.num_atom_each_file[i]<< std::endl;  
-    //std::cout<<data.data_files[i].substr(data.data_path.size()+1,data.data_files[i].size())<<std::endl;
+    data.filenames.push_back(filename.c_str());
+    utils::logmesg(lmp, "{}   |   {}   |   {}\n", data.filenames[i], data.num_config[i], data.num_atom_each_file[i]);
  }  
-  std::cout << "number of files: " <<data.data_files.size() << std::endl;   
-  std::cout << "number of configurations in all files: " <<data.num_config_sum << std::endl;   
-  std::cout << "number of atoms in all files: " <<data.num_atom_sum << std::endl;     
+  utils::logmesg(lmp, "number of files: {}\n", data.data_files.size());
+  utils::logmesg(lmp, "number of configurations in all files: {}\n", data.num_config_sum);
+  utils::logmesg(lmp, "number of atoms in all files: {}\n", data.num_atom_sum);    
  
  int n = data.num_config_sum;
  data.lattice = (double *) malloc(9*n*sizeof(double));
@ -497,8 +494,8 @@ void CPODFIT::get_data(datastruct &data, std::vector<std::string> species)
    podptr->matrix33_multiplication(f, Qmat, f, natom);   
  }
    
-  std::cout << "minimum number of atoms: " <<data.num_atom_min << std::endl;   
-  std::cout << "maximum number of atoms: " <<data.num_atom_max << std::endl;   
+  utils::logmesg(lmp, "minimum number of atoms: {}\n", data.num_atom_min);
+  utils::logmesg(lmp, "maximum number of atoms: {}\n", data.num_atom_max); 
 }

 std::vector<int> CPODFIT::linspace(int start_in, int end_in, int num_in)
@ -571,10 +568,10 @@ void CPODFIT::select_data(datastruct &newdata, datastruct data)
  double percentage = data.percentage;
  int randomize = data.randomize;    
    
-  if (randomize==1) 
-    std::cout << "Select " <<data.percentage*100 <<" percent of the data set at random using shuffle"<< std::endl;   
+  if (randomize==1)
+    utils::logmesg(lmp, "Select {} percent of the data set at random using shuffle\n", data.percentage*100); 
  else 
-    std::cout << "Select " <<data.percentage*100 <<" percent of the data set deterministically using linspace"<< std::endl;   
+    utils::logmesg(lmp, "Select {} percent of the data set deterministically using linspace\n", data.percentage*100); 

  int nfiles = data.data_files.size();  // number of files  
  std::vector<std::vector<int>> selected(nfiles);
@ -658,15 +655,15 @@ void CPODFIT::select_data(datastruct &newdata, datastruct data)
  
  data.copydatainfo(newdata);  

-  std::cout<<"data file  | # configurations (selected) | # atoms (selected) | # configurations (original) | # atoms (original) "<<std::endl;
+  utils::logmesg(lmp, "data file  | # configs (selected) | # atoms (selected) | # configs (original) | # atoms (original)\n");
  for (int i=0; i< (int) newdata.data_files.size(); i++) {
    string filename = newdata.data_files[i].substr(newdata.data_path.size()+1,newdata.data_files[i].size());
-    newdata.filenames.push_back(filename.c_str());                    
-    std::cout<<newdata.filenames[i]<<"   |   "<<newdata.num_config[i]<<"   |   "<<newdata.num_atom_each_file[i]<<"   |   "<<data.num_config[i]<<"   |   "<<data.num_atom_each_file[i]<< std::endl;  
-  }  
-  std::cout << "number of files: " <<newdata.data_files.size() << std::endl;   
-  std::cout << "number of configurations in all files (selected and original): " <<newdata.num_config_sum<<" and "<<data.num_config_sum << std::endl;   
-  std::cout << "number of atoms in all files (selected and original): "<<newdata.num_atom_sum <<" and "<< data.num_atom_sum << std::endl;      
+    newdata.filenames.push_back(filename.c_str());
+    utils::logmesg(lmp, "{}   |   {}   |   {}   |   {}   |   {}\n", newdata.filenames[i], newdata.num_config[i], newdata.num_atom_each_file[i], data.num_config[i], data.num_atom_each_file[i]);              
+  }
+  utils::logmesg(lmp, "number of files: {}\n", newdata.data_files.size());
+  utils::logmesg(lmp, "number of configurations in all files (selected and original): {} and {}\n", newdata.num_config_sum, data.num_config_sum);
+  utils::logmesg(lmp, "number of atoms in all files (selected and original: {} and {}\n", newdata.num_atom_sum, data.num_atom_sum);    
 }

 void CPODFIT::read_data_files(std::string data_file, std::vector<std::string> species)
@ -686,25 +683,25 @@ void CPODFIT::read_data_files(std::string data_file, std::vector<std::string> sp
  
  data.copydatainfo(traindata); 
  
-  if (data.percentage >= 1.0) {         
-    std::cout<<"**************** Begin of Training Data Set ****************"<<std::endl;    
+  if (data.percentage >= 1.0) {        
+    utils::logmesg(lmp, "**************** Begin of Training Data Set ****************\n");  
    if ((int) traindata.data_path.size() > 1) 
      this->get_data(traindata, species);
    else 
-      error->all(FLERR,"data set is not found");          
-    std::cout<<"**************** End of Training Data Set ****************"<<std::endl<<std::endl;          
+      error->all(FLERR,"data set is not found");     
+    utils::logmesg(lmp, "**************** End of Training Data Set ****************\n");               
  }
  else {
-    std::cout<<"**************** Begin of Training Data Set ****************"<<std::endl;    
+    utils::logmesg(lmp, "**************** Begin of Training Data Set ****************\n");    
    if ((int) data.data_path.size() > 1) 
      this->get_data(data, species);
    else 
      error->all(FLERR,"data set is not found");            
-    std::cout<<"**************** End of Training Data Set ****************"<<std::endl<<std::endl;          
+    utils::logmesg(lmp, "**************** End of Training Data Set ****************\n");          
    
-    std::cout<<"**************** Begin of Select Training Data Set ****************"<<std::endl;
-    select_data(traindata, data);    
-    std::cout<<"**************** End of Select Training Data Set ****************"<<std::endl<<std::endl;
+    utils::logmesg(lmp, "**************** Begin of Select Training Data Set ****************\n");
+    select_data(traindata, data);
+    utils::logmesg(lmp, "**************** End of Select Training Data Set ****************\n");
    
    data.freememory(1);
  }
@ -718,10 +715,10 @@ void CPODFIT::read_data_files(std::string data_file, std::vector<std::string> sp
    testdata.training_calculation = traindata.training_calculation;
    testdata.test_calculation = traindata.test_calculation;
    testdata.percentage = traindata.fitting_weights[8];
-    testdata.randomize = (int) traindata.fitting_weights[10];    
-    std::cout<<"**************** Begin of Test Data Set ****************"<<std::endl;
+    testdata.randomize = (int) traindata.fitting_weights[10];   
+    utils::logmesg(lmp, "**************** Begin of Test Data Set ****************\n");
    this->get_data(testdata, species);
-    std::cout<<"**************** End of Test Data Set ****************"<<std::endl<<std::endl;  
+    utils::logmesg(lmp, "**************** End of Test Data Set ****************\n"); 
  }
  else {
    testdata.data_path = traindata.data_path;
@ -878,7 +875,7 @@ void CPODFIT::allocate_memory(datastruct data)
  nb.szy = ny;  
  nb.szp = np;  
  
-  std::cout<<"**************** Begin of Memory Allocation ****************"<<std::endl;
+  utils::logmesg(lmp,"**************** Begin of Memory Allocation ****************\n");
  
  int szd = 0, szi=0, szsnap=0;
  for (int ci=0; ci<(int) data.num_atom.size(); ci++)
@ -931,13 +928,13 @@ void CPODFIT::allocate_memory(datastruct data)
  desc.szd = szd;
  desc.szi = szi;    

-  std::cout<<"maximum number of atoms in periodic domain: "<<natom_max<<std::endl;
-  std::cout<<"maximum number of atoms in extended domain: "<<nb.sza<<std::endl;
-  std::cout<<"maximum number of neighbors in extended domain: "<<nb.szp<<std::endl;
-  std::cout<<"size of double memory: "<<szd<<std::endl;
-  std::cout<<"size of int memory: "<<szi<<std::endl;
-  std::cout<<"size of descriptor matrix: "<<nd<<" x "<<nd<<std::endl;
-  std::cout<<"**************** End of Memory Allocation ****************"<<std::endl<<std::endl;
+  utils::logmesg(lmp, "maximum number of atoms in periodic domain: {}\n", natom_max);
+  utils::logmesg(lmp, "maximum number of atoms in extended domain: {}\n", nb.sza);
+  utils::logmesg(lmp, "maximum number of neighbors in extended domain: {}\n", nb.szp);
+  utils::logmesg(lmp, "size of double memory: {}\n", szd);
+  utils::logmesg(lmp, "size of int memory: {}\n", szi);
+  utils::logmesg(lmp, "size of descriptor matrix: {} x {}\n", nd, nd);
+  utils::logmesg(lmp, "**************** End of Memory Allocation ****************\n");
 }

 void CPODFIT::linear_descriptors(datastruct data, int ci)
@ -1167,12 +1164,12 @@ void CPODFIT::least_squares_matrix(datastruct data, int ci)

 void CPODFIT::least_squares_fit(datastruct data)
 {    
-  std::cout<<"**************** Begin of Least-Squares Fitting ****************"<<std::endl;
+  utils::logmesg(lmp, "**************** Begin of Least-Squares Fitting ****************\n");
  
  // loop over each configuration in the training data set

  for (int ci=0; ci < (int) data.num_atom.size(); ci++) {
-    if ((ci % 100)==0) std::cout<<"Configuration: # "<<ci+1<<std::endl;
+    if ((ci % 100)==0) utils::logmesg(lmp, "Configuration: # {}\n", ci+1);
    
    // compute linear POD descriptors

@ -1216,9 +1213,9 @@ void CPODFIT::least_squares_fit(datastruct data)
      myfile << std::setprecision(20)<< desc.c[count] << std::endl;    
    myfile.close();
  }
-  else std::cout << "Unable to open file";
+  else utils::logmesg(lmp, "Unable to open file\n");
  
-  std::cout<<"**************** End of Least-Squares Fitting ****************"<<std::endl<<std::endl;
+  utils::logmesg(lmp, "**************** End of Least-Squares Fitting ****************\n");
 }

 double CPODFIT::energyforce_calculation(double *force, double *coeff, datastruct data, int ci)
@ -1272,23 +1269,26 @@ void CPODFIT::print_analysis(datastruct data, double *outarray, double *errors)
  
  std::string filename = data.training ? "training_errors.txt" : "test_errors.txt";   
  std::ofstream myfile (filename);
-  if (!myfile.is_open()) std::cout << "Unable to open file";
+  if (!myfile.is_open()) utils::logmesg(lmp, "Unable to open file");
  
  filename = data.training ? "training_analysis.txt" : "test_analysis.txt";
  std::ofstream mfile (filename);
-  if (!mfile.is_open()) std::cout << "Unable to open file";
+  if (!mfile.is_open()) utils::logmesg(lmp, "Unable to open file");
    
  std::string sa = "**************** Begin of Error Analysis for the Training Data Set ****************";
  std::string sb = "**************** Begin of Error Analysis for the Test Data Set ****************";      
-  std::string mystr = (data.training) ? sa : sb;  
-  std::cout<<mystr<<std::endl;      
+  std::string mystr = (data.training) ? sa : sb;   
+  utils::logmesg(lmp, "{}\n", mystr);    
  myfile <<mystr+"\n";
  
  sa = "----------------------------------------------------------------------------------------\n";
  sb = "  File    | # configs | # atoms  | MAE energy | RMSE energy | MAE force | RMSE force |\n";
-  std::cout<<sa; myfile <<sa;
-  std::cout<<sb; myfile <<sb;
-  std::cout<<sa; myfile <<sa;   
+  utils::logmesg(lmp, "{}", sa); 
+  utils::logmesg(lmp, "{}", sb);
+  utils::logmesg(lmp, "{}", sa);
+  myfile << sa;
+  myfile << sb;
+  myfile << sa;   
  
  int ci=0, m=8, nc=0, nf=0;  
  for (int file = 0; file < nfiles; file++) {    
@ -1332,10 +1332,11 @@ void CPODFIT::print_analysis(datastruct data, double *outarray, double *errors)
    s1 = std::to_string(errors[3 + 4*q]);
    s1 = s1 + std::string(PODMAX(10 - (int) s1.size(),1), ' ');  
    s = s + "   " + s1 + "\n";    
-    std::cout<<s; 
+    utils::logmesg(lmp, "{}", s);
    myfile <<s;    
  }
-  std::cout<<sa; myfile <<sa;
+  utils::logmesg(lmp, "{}", sa);
+  myfile << sa;
    
  s = s + std::string(PODMAX(lm - (int) s.size(),1), ' ');     
  string s1 = std::to_string(nc);
@ -1355,14 +1356,16 @@ void CPODFIT::print_analysis(datastruct data, double *outarray, double *errors)
  s = s + "   " + s1;
  s1 = std::to_string(errors[3]);
  s1 = s1 + std::string(PODMAX(10 - (int) s1.size(),1), ' ');  
-  s = s + "   " + s1 + "\n";    
-  std::cout<<s; myfile <<s;
-  std::cout<<sa; myfile <<sa;
+  s = s + "   " + s1 + "\n";  
+  utils::logmesg(lmp, "{}", s);
+  utils::logmesg(lmp, "{}", sa);
+  myfile << s;
+  myfile << sa;
  
  sa = "**************** End of Error Analysis for the Training Data Set ****************";    
  sb = "**************** End of Error Analysis for the Test Data Set ****************";   
-  mystr = (data.training) ? sa : sb;  
-  std::cout<<mystr<<std::endl;      
+  mystr = (data.training) ? sa : sb;       
+  utils::logmesg(lmp, "{}\n", mystr); 
  myfile <<mystr+"\n";  
  myfile.close();
  mfile.close();  
@ -1404,7 +1407,7 @@ void CPODFIT::error_analsysis(datastruct data, double *coeff)
  for (int j=0; j<nd; j++)
    newcoeff[j] = coeff[j];
  
-  std::cout<<"**************** Begin of Error Calculation ****************"<<std::endl;
+  utils::logmesg(lmp, "**************** Begin of Error Calculation ****************\n");
  
  int ci = 0; // configuration counter  
  int nc = 0, nf = 0;  
@ -1415,7 +1418,7 @@ void CPODFIT::error_analsysis(datastruct data, double *coeff)
    int nconfigs = data.num_config[file];
    nc += nconfigs;
    for (int ii=0; ii < nconfigs; ii++) { // loop over each configuration in a file
-      if ((ci % 100)==0) std::cout<<"Configuration: # "<<ci+1<<std::endl;
+      if ((ci % 100)==0) utils::logmesg(lmp, "Configuration: # {}\n", ci+1);
      
      int natom = data.num_atom[ci];
      int nforce = dim*natom;
@ -1473,7 +1476,7 @@ void CPODFIT::error_analsysis(datastruct data, double *coeff)
  errors[2] = errors[2]/nf;
  errors[3] = sqrt(errors[3]/nf);
  
-  std::cout<<"**************** End of Error Calculation ****************"<<std::endl<<std::endl;
+  utils::logmesg(lmp, "**************** End of Error Calculation ****************\n");
  
  print_analysis(data, outarray, errors);  
 }
@ -1487,14 +1490,14 @@ void CPODFIT::energyforce_calculation(datastruct data, double *coeff)
  int nfiles = data.data_files.size();  // number of files  

                
-  std::cout<<"**************** Begin of Energy/Force Calculation ****************"<<std::endl;
+  utils::logmesg(lmp, "**************** Begin of Energy/Force Calculation ****************\n");
  
  int ci = 0; // configuration counter  
  for (int file = 0; file < nfiles; file++) { // loop over each file in the data set
    
    int nconfigs = data.num_config[file];
    for (int ii=0; ii < nconfigs; ii++) { // loop over each configuration in a file
-      if ((ci % 100)==0) std::cout<<"Configuration: # "<<ci+1<<std::endl;
+      if ((ci % 100)==0) utils::logmesg(lmp, "Configuration: # {}\n", ci+1);
      
      int natom = data.num_atom[ci];
      int nforce = dim*natom;
@ -1510,7 +1513,7 @@ void CPODFIT::energyforce_calculation(datastruct data, double *coeff)
      writearray2file(filename.c_str(), force, 1 + nforce, 1);
    }
  }     
-  std::cout<<"**************** End of Energy/Force Calculation ****************"<<std::endl<<std::endl;  
+  utils::logmesg(lmp, "**************** End of Energy/Force Calculation ****************\n");
 }

 #endif    
--- a/src/ML-POD/pair_pod.cpp
+++ b/src/ML-POD/pair_pod.cpp
--- a/src/ML-POD/pair_pod.h
+++ b/src/ML-POD/pair_pod.h
@ -13,94 +13,22 @@ PairStyle(pod,CPairPOD);
 namespace LAMMPS_NS {

  class CPairPOD : public Pair {
-  private:
-      std::vector<std::string> globVector(const std::string& pattern, std::vector<std::string> & files);
-          
-      bool is_a_number(std::string line);
-      
-      int latticecoords(double *y, int *alist, double *x, double *a1, double *a2, double *a3, double rcut, int *pbc, int nx);
-      
-      int podneighborcount(double *r, double rcutsq, int nx, int N, int dim);
-      int podneighborlist(int *neighlist, int *numneigh, double *r, double rcutsq, int nx, int N, int dim);
-      
-      void read_data_file(double *inputs, std::string &file_format, std::string &file_extension, 
-          std::string &data_path, std::string data_file);
-
-      void get_exyz_files(std::vector<std::string>& files, std::string datapath, std::string extension);
-      
-      int get_number_atom_exyz(std::vector<int>& num_atom, int& num_atom_sum, std::string file);  
-      
-      int get_number_atoms(std::vector<int>& num_atom, std::vector<int> &num_atom_sum, std::vector<int>& num_config, std::vector<std::string> training_files);  
-      
-      void read_exyz_file(double *lattice, double *stress, double *energy, double *pos, double *vel, 
-              double *forces, int *atomtype, std::string file, std::vector<std::string> species);
-      
-      void get_data(std::vector<std::string> species);
-
-      void read_data_files(std::string data_file, std::vector<std::string> species);    
-      
-  public:
-      struct datastruct {     
-          std::string file_format;
-          std::string file_extension;    
-          std::string data_path;    
-          std::vector<std::string> data_files;     
-          std::vector<std::string> filenames;     
-
-          std::vector<int> num_atom;
-          std::vector<int> num_atom_cumsum;
-          std::vector<int> num_atom_each_file;
-          std::vector<int> num_config;
-          std::vector<int> num_config_cumsum;
-          int num_atom_sum; 
-          int num_atom_min; 
-          int num_atom_max; 
-          int num_config_sum;    
-
-          double *lattice=NULL;
-          double *energy=NULL; 
-          double *stress=NULL;
-          double *position=NULL;
-          double *velocity=NULL;
-          double *force=NULL;
-          int *atomtype=NULL;
-
-          void copydatainfo(datastruct &data) {
-              data.data_path = data_path;        
-              data.file_format = file_format;
-              data.file_extension = file_extension;              
-              data.data_files = data_files;
-              data.filenames = filenames;            
-          }                
-
-          void freememory(int backend)
-          {
-              TemplateFree(lattice, backend);        
-              TemplateFree(energy, backend);        
-              TemplateFree(stress, backend);        
-              TemplateFree(position, backend);  
-              TemplateFree(velocity, backend);  
-              TemplateFree(force, backend);        
-              TemplateFree(atomtype, backend);        
-          }            
-      };
-
-      datastruct data;
+    public:
      class CPOD *podptr;
-      
+
      CPairPOD(class LAMMPS *);
      ~CPairPOD() override;
      void compute(int, int) override;
-      
+
      void settings(int, char **) override;
      void coeff(int, char **) override;
      void init_style() override;
      double init_one(int, int) override;
      double memory_usage() override;
      void *extract(const char *, int &) override;
-    
-      void InitPairPOD(std::string pod_file, std::string coeff_file, std::string data_file); 
-      
+
+      void InitPairPOD(std::string pod_file, std::string coeff_file);
+
      int backend=1;
      int dim = 3;
      int atommemory = 0;
@ -112,129 +40,125 @@ namespace LAMMPS_NS {
      int savefrequency = 0;
      int blocksize=8192;      // avereage size of computation blocks
      int randomrotation = 0;
-      
-      double energy=0.0;    // potential energy    
+
+      double energy=0.0;    // potential energy
      double *forces=NULL;   // atomic forces
      double *stress=NULL;  // stress tensor
      int *atomtype=NULL;   // atomic types for all atoms
      double *pos=NULL;     // positions of atoms
      double *vel=NULL;     // velocity of atoms
-      
-      double *gd=NULL;         // global linear descriptors 
-      double *podcoeff=NULL;   // POD coefficients  
-      double *newpodcoeff=NULL;// normalized POD coefficients  
+
+      double *gd=NULL;         // global linear descriptors
+      double *podcoeff=NULL;   // POD coefficients
+      double *newpodcoeff=NULL;// normalized POD coefficients
      double *energycoeff=NULL; // energy coefficients
      double *forcecoeff=NULL; // force coefficients
-      
-      double *y=NULL;      // [dim * nmaxatom] positions of own and ghost atoms        
-      int *atomID=NULL;  // [nmaxatom]  IDs of owned and ghost atoms      
-      int *pairlist=NULL;  // [nmaxpairs] indices of neighbors for owned atoms    
-      int *pairnum=NULL;   // [nmaxatom] number of pairs for all atoms i 
+
+      double *y=NULL;      // [dim * nmaxatom] positions of own and ghost atoms
+      int *atomID=NULL;  // [nmaxatom]  IDs of owned and ghost atoms
+      int *pairlist=NULL;  // [nmaxpairs] indices of neighbors for owned atoms
+      int *pairnum=NULL;   // [nmaxatom] number of pairs for all atoms i
      int *pairnumsum=NULL;// [nmaxatom+1] cumulative sum of pairnum
-      
-      int numatoms=0;    // number of atom in the simulation box    
-      int nlocalatom=0;  // number of owned atoms    
+
+      int numatoms=0;    // number of atom in the simulation box
+      int nlocalatom=0;  // number of owned atoms
      int nghostatom=0;  // number of ghost atoms
      int ntotalatom=0;  // number of owned + ghost atoms
      int nlocalmax=0;   // maximum number of owned atoms
-      int nmaxatom=0;    // maximum number of atoms (nmaxatom >= ntotalatom)   
-      int natompairs=0;  // total number of atom pairs for owned atoms    
-      int nmaxpairs=0;   // maximum number of atom pairs for owned atoms    
-      
-      void check_tempmemory(int start, int end);       
+      int nmaxatom=0;    // maximum number of atoms (nmaxatom >= ntotalatom)
+      int natompairs=0;  // total number of atom pairs for owned atoms
+      int nmaxpairs=0;   // maximum number of atom pairs for owned atoms
+
+      void check_tempmemory(int start, int end);
      void check_tempmemory(double **x, int **firstneigh, int *numneigh, int *ilist, int start, int end);
-      void estimate_tempmemory();    
+      void estimate_tempmemory();
      void free_tempmemory();
      void allocate_tempmemory();
-          
-      void check_pairmemory(double *x, double *a1, double *a2, double *a3, int natom);    
-      void free_pairmemory();
-      void allocate_pairmemory();
-      
+
      void check_atommemory(int inum, int nall);
-      void free_atommemory();    
-      void allocate_atommemory();    
-      
-      void free_memory();            
+      void free_atommemory();
+      void allocate_atommemory();
+
+      void free_memory();
      void allocate_memory();
-      void estimate_memory(datastruct data);    
-          
+      void estimate_memory(datastruct data);
+
      void get_atomblocks(int natom);
-      
-      int podfullneighborlist(double *y, int *alist, int *pairlist, int *pairnum, int *pairnumsum, 
+
+      int podfullneighborlist(double *y, int *alist, int *pairlist, int *pairnum, int *pairnumsum,
          double *x, double *a1, double *a2, double *a3, double rcut, int *pbc, int nx);
-          
+
      void podNeighPairs(int *atomtype, int istart, int iend);
-          
-      void lammpsNeighPairs(double **x, int **firstneigh, int *atomtype, int *numneigh, 
+
+      void lammpsNeighPairs(double **x, int **firstneigh, int *atomtype, int *numneigh,
              int *ilist, int istart, int iend);
-              
+
      void lammpsNeighPairs(double **x, int **firstneigh, int *atomtype, int *map, int *numneigh, int i);
      
-      double podenergy(double *x, double *a1, double *a2, double *a3, int *atomtype, int inum);    
+      double podenergy(double *x, double *a1, double *a2, double *a3, int *atomtype, int inum);
      double podeatom(double *eatom, double *x, double *a1, double *a2, double *a3, int *atomtypes, int inum);
      void podforce(double *f, double *x, double *a1, double *a2, double *a3, int *atomtypes, int inum);
-      double podenergyforce(double *f, double *x, double *a1, double *a2, double *a3, int *atomtype, int inum);      
-      
+      double podenergyforce(double *f, double *x, double *a1, double *a2, double *a3, int *atomtype, int inum);
+
      double lammpsenergy(double **x, int **firstneigh, int *atype, int *numneigh, int *ilist, int inum, int nall);
-      double lammpseatom(double *eatom, double **x, int **firstneigh, int *atomtypes, int *numneigh, 
+      double lammpseatom(double *eatom, double **x, int **firstneigh, int *atomtypes, int *numneigh,
          int *ilist, int inum, int nall);
-      void lammpsforce(double **f, double **x, int **firstneigh, int *atomtypes, 
+      void lammpsforce(double **f, double **x, int **firstneigh, int *atomtypes,
          int *numneigh, int *ilist, int inum, int nall);
-      double lammpsenergyforce(double **f, double **x, int **firstneigh, int *atomtype, int *numneigh, int *ilist, int inum, int nall);     
-              
-      
+      double lammpsenergyforce(double **f, double **x, int **firstneigh, int *atomtype, int *numneigh, int *ilist, int inum, int nall);
+
+
      void print_analysis(double *outarray, double *errors);
      void error_analsysis();
-      
+
      void printinfo()
-      {        
-          printf("print pairpod information: \n"); 
-          printf("backend %d \n", backend); 
-          printf("podpairlist %d \n", podpairlist);         
-          printf("lammpspairlist %d \n", lammpspairlist);         
-          printf("analysis %d \n", analysis);         
-          printf("runMD %d \n", runMD); 
+      {
+          printf("print pairpod information: \n");
+          printf("backend %d \n", backend);
+          printf("podpairlist %d \n", podpairlist);
+          printf("lammpspairlist %d \n", lammpspairlist);
+          printf("analysis %d \n", analysis);
+          printf("runMD %d \n", runMD);
          printf("savecalculation %d \n", savecalculation);
-          printf("savefrequency %d \n", savefrequency);       
+          printf("savefrequency %d \n", savefrequency);
          printf("numatoms %d \n", numatoms);
          printf("nlocalatom %d \n", nlocalatom);
          printf("nghostatom %d \n", nghostatom);
          printf("ntotalatom %d \n", ntotalatom);
          printf("nlocalmax %d \n", nlocalmax);
          printf("nmaxatom %d \n", nmaxatom);
-          printf("natompairs %d \n", natompairs);        
-          printf("nmaxpairs %d \n", nmaxpairs);                       
-          printf("numblocks %d \n", numblocks);        
+          printf("natompairs %d \n", natompairs);
+          printf("nmaxpairs %d \n", nmaxpairs);
+          printf("numblocks %d \n", numblocks);
          printf("blocksize %d \n", blocksize);
          printf("nablock %d \n", nablock);
-          printf("nablockmax %d \n", nablockmax);       
-          printf("nij %d \n", nij);       
-          printf("nijmax %d \n", nijmax);       
-          printf("szd %d \n", szd);       
-      }    
-          
+          printf("nablockmax %d \n", nablockmax);
+          printf("nij %d \n", nij);
+          printf("nijmax %d \n", nijmax);
+          printf("szd %d \n", szd);
+      }
+
  protected:
-      int atomblocks[1001]; // store sizes of computation blocks   
-      int numblocks=1;      // number of computation blocks                        
-      int nablock=0;        // number of atoms per computation block    
-      int nablockmax=0;     // maximum number of atoms per computation block    
-      int nij=0;    //  number of atom pairs per computation block    
-      int nijmax=0;  // maximum number of atom pairs per computation block              
+      int atomblocks[1001]; // store sizes of computation blocks
+      int numblocks=1;      // number of computation blocks
+      int nablock=0;        // number of atoms per computation block
+      int nablockmax=0;     // maximum number of atoms per computation block
+      int nij=0;    //  number of atom pairs per computation block
+      int nijmax=0;  // maximum number of atom pairs per computation block
      int szd=0;    // size of tmpmem
-      
-      // temporary arrays for computation blocks  
+
+      // temporary arrays for computation blocks
      double *tmpmem=NULL;  // temporary memory
      int *typeai=NULL;     // types of atoms I only
-      int *numneighsum=NULL;// cumulative sum for an array of numbers of neighbors    
+      int *numneighsum=NULL;// cumulative sum for an array of numbers of neighbors
      double *rij=NULL;     // (xj - xi) for all pairs (I, J)
      int *idxi=NULL;       // storing linear indices for all pairs (I, J)
      int *ai=NULL;         // IDs of atoms I for all pairs (I, J)
      int *aj=NULL;         // IDs of atoms J for all pairs (I, J)
-      int *ti=NULL;         // types of atoms I for all pairs (I, J) 
+      int *ti=NULL;         // types of atoms I for all pairs (I, J)
      int *tj=NULL;         // types of atoms J  for all pairs (I, J)
-          
-      double **scale;         // for thermodynamic integration        
+
+      double **scale;         // for thermodynamic integration
  };

 }    // namespace LAMMPS_NS
--- a/src/ML-POD/pod.cpp
+++ b/src/ML-POD/pod.cpp