Physics class + Lassen compatibility (#2)
* physics class

* generalized physics solution shape in latent space.

* minor

* updated README

* activation for autoencoder

* lassen compatible.
dreamer2368 authored Jul 3, 2024
1 parent 4ebad94 commit 9b4cb93
Showing 11 changed files with 538 additions and 220 deletions.
.gitignore (1 addition, 0 deletions)
@@ -6,3 +6,4 @@ examples/data
examples/results
examples/checkpoint
*.npy
build
README.md (38 additions, 0 deletions)
@@ -25,6 +25,44 @@ make install

Please install [OpenCE-1.1.2](https://lc.llnl.gov/confluence/pages/viewpage.action?pageId=678892406)

## Python packaging (work-in-progress)

The repository is transitioning to Python packaging. Users can install the repository as a Python package:
```
pip install .
```
This Python package requires updated prerequisites:
```
"torch>=2.3.0",
"numpy>=1.26.4",
"scikit-learn>=1.4.2",
"scipy>=1.13.1",
"pyyaml>=6.0",
"matplotlib>=3.8.4",
"argparse>=1.4.0"
```

Currently, not all features are supported. The 1D Burgers equation example can be run:
```
cd examples
lasdi burgers1d.yml
```
Post-processing & visualization of the Burgers 1D equation can be seen in the jupyter notebook `examples/burgers1d.ipynb`.

### For LLNL LC Lassen users

The work-in-progress Python package is compatible with [OpenCE-1.9.1](https://lc.llnl.gov/confluence/pages/viewpage.action?pageId=785286611).
To install GPLasDI in an OpenCE environment:
```
source /your/anaconda
conda activate /your/opence/environment
conda install scikit-learn
pip install argparse
pip install .
```

## Examples

Four examples are provided, including
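As an aside on the notebook workflow: the results dictionary that `src/lasdi/gplasdi.py` saves (see its diff below) can be reloaded for post-processing. A minimal sketch, assuming the default `results` path from `examples/burgers1d.yml`; the timestamp in the file name is illustrative:

```python
import numpy as np

# bglasdi_results is a Python dict saved with np.save, so allow_pickle is
# required to recover it via .item(). The timestamp here is illustrative.
results = np.load('results/bglasdi_07_03_2024_12_00.npy', allow_pickle=True).item()
print(results.keys())  # e.g. 'a_grid', 'w_grid', 'physics', 'total_time', ...
```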
examples/burgers1d.ipynb (182 additions, 29 deletions)

Large diffs are not rendered by default.

examples/burgers1d.yml (10 additions, 21 deletions)
@@ -9,14 +9,8 @@ lasdi:
  max_greedy_iter: 28000
  sindy_weight: 0.1
  coef_weight: 1.e-6
  path_checkpoint: checkpoint/
  path_results: results/
  # This probably should be specified on physics part.
  time_dim: 1001
  space_dim: 1001
  xmin: -3.
  xmax: 3.
  tmax: 1.
  path_checkpoint: checkpoint
  path_results: results
  # This probably should be specified as parameters.
  a_min: 0.7
  a_max: 0.9
@@ -33,21 +27,16 @@ latent_space:
  hidden_units: [100]
  latent_dimension: 5

# TODO(kevin): temporary placeholder
initial_train:
  train_data: data/data_train.npy
  test_data: data/data_test.npy

physics:
  type: burgers1d
  burgers1d:
    time_dim: 1001
    space_dim: 1001
    number_of_timesteps: 1001
    simulation_time: 1.
    grid_size: [1001]
    xmin: -3.
    xmax: 3.
    tmax: 1.
initial_train:
  train_data: data/data_train.npy
  test_data: data/data_test.npy
# This probably should be specified as parameters.
a_min: 0.7
a_max: 0.9
w_min: 0.9
w_max: 1.1
n_a_grid: 21
n_w_grid: 21
pyproject.toml (7 additions, 7 deletions)
@@ -8,20 +8,20 @@ authors = [
]
description = "LaSDI: Parametric latent space dynamics identification"
readme = "README.md"
requires-python = ">=3.12"
requires-python = ">=3.9"
classifiers = [
    "Programming Language :: Python :: 3",
    "License :: OSI Approved :: MIT License",
    "Operating System :: OS Independent",
]
dependencies = [
    "torch>=2.3.0",
    "numpy>=1.26.4",
    "scikit-learn>=1.4.2",
    "scipy>=1.13.1",
    "torch>=2.0.1",
    "numpy>=1.23.0",
    "scikit-learn>=1.3",
    "scipy>=1.10",
    "pyyaml>=6.0",
    "matplotlib>=3.8.4",
    "argparse>=1.4.0"
    "matplotlib>=3.8.0",
    "argparse>=1.1"
]

[project.urls]
Expand Down
src/lasdi/gplasdi.py (23 additions, 45 deletions)
@@ -35,7 +35,7 @@ def find_sindy_coef(Z, Dt, n_train, time_dim, loss_function):
    return loss_sindy, loss_coef, sindy_coef

class BayesianGLaSDI:
    def __init__(self, autoencoder, model_parameters):
    def __init__(self, autoencoder, physics, model_parameters):

        '''
@@ -47,28 +47,7 @@ def __init__(self, autoencoder, model_parameters):
        '''

        self.autoencoder = autoencoder

        # TODO(kevin): we need to simply possess physics object.
        self.time_dim = model_parameters['time_dim']
        self.space_dim = model_parameters['space_dim']
        # self.n_z = model_parameters['n_z']

        # TODO(kevin): we need to simply possess physics object.
        xmin = model_parameters['xmin']
        xmax = model_parameters['xmax']
        self.Dx = (xmax - xmin) / (self.space_dim - 1)
        assert(self.Dx > 0.)

        tmax = model_parameters['tmax']
        self.Dt = tmax / (self.time_dim - 1)

        self.x_grid = np.linspace(xmin, xmax, self.space_dim)
        self.t_grid = np.linspace(0, tmax, self.time_dim)

        # TODO(kevin): generalize physics
        # self.initial_condition = model_parameters['initial_condition']
        from .physics.burgers1d import initial_condition
        self.initial_condition = initial_condition
        self.physics = physics

        # TODO(kevin): generalize parameters
        self.a_min = model_parameters['a_min']
@@ -131,6 +110,9 @@ def train(self):
        end_train_phase = []
        end_fom_phase = []

        from pathlib import Path
        Path(self.path_checkpoint).mkdir(parents=True, exist_ok=True)
        Path(self.path_results).mkdir(parents=True, exist_ok=True)

        start_train_phase.append(tic_start)

@@ -142,7 +124,7 @@ def train(self):
            Z = Z.cpu()

            loss_ae = self.MSE(X_train_device, X_pred)
            loss_sindy, loss_coef, sindy_coef = find_sindy_coef(Z, self.Dt, self.n_train, self.time_dim, self.MSE)
            loss_sindy, loss_coef, sindy_coef = find_sindy_coef(Z, self.physics.dt, self.n_train, self.physics.nt, self.MSE)

            max_coef = np.abs(np.array(sindy_coef)).max()

@@ -152,7 +134,7 @@ def train(self):
            self.optimizer.step()

            if loss.item() < self.best_loss:
                torch.save(autoencoder_device.state_dict(), self.path_checkpoint + 'checkpoint.pt')
                torch.save(autoencoder_device.state_dict(), self.path_checkpoint + '/' + 'checkpoint.pt')
                self.best_sindy_coef = sindy_coef
                self.best_loss = loss.item()

@@ -184,19 +166,19 @@ def train(self):
            start_fom_phase.append(time.time())
            # X_train = X_train_device.cpu()
            autoencoder = autoencoder_device.cpu()
            autoencoder.load_state_dict(torch.load(self.path_checkpoint + 'checkpoint.pt'))
            autoencoder.load_state_dict(torch.load(self.path_checkpoint + '/' + 'checkpoint.pt'))

            if len(self.best_sindy_coef) == self.n_train:
                sindy_coef = self.best_sindy_coef

            Z0 = initial_condition_latent(self.param_grid, self.initial_condition, self.x_grid, autoencoder)
            Z0 = initial_condition_latent(self.param_grid, self.physics, autoencoder)

            interpolation_data = build_interpolation_data(sindy_coef, self.param_train)
            gp_dictionnary = fit_gps(interpolation_data)
            n_coef = interpolation_data['n_coef']

            coef_samples = [interpolate_coef_matrix(gp_dictionnary, self.param_grid[i, :], self.n_samples, n_coef, sindy_coef) for i in range(self.n_test)]
            Zis = [simulate_uncertain_sindy(gp_dictionnary, self.param_grid[i, 0], self.n_samples, Z0[i], self.t_grid, sindy_coef, n_coef, coef_samples[i]) for i in range(self.n_test)]
            Zis = [simulate_uncertain_sindy(gp_dictionnary, self.param_grid[i, 0], self.n_samples, Z0[i], self.physics.t_grid, sindy_coef, n_coef, coef_samples[i]) for i in range(self.n_test)]

            a_index, w_index, m_index = get_max_std(autoencoder, Zis, self.n_a_grid, self.n_w_grid)

@@ -222,34 +204,30 @@ def train(self):
                           'n_greedy': self.n_greedy, 'sindy_weight': self.sindy_weight, 'coef_weight': self.coef_weight,
                           'n_init': self.n_init, 'n_samples' : self.n_samples, 'n_a_grid' : self.n_a_grid, 'n_w_grid' : self.n_w_grid,
                           'a_grid' : self.a_grid, 'w_grid' : self.w_grid,
                           't_grid' : self.t_grid, 'x_grid' : self.x_grid, 'Dt' : self.Dt, 'Dx' : self.Dx,
                           # TODO(kevin): need to fix timer.
                           'total_time' : total_time, 'start_train_phase' : start_train_phase,
                           'start_fom_phase' : start_fom_phase, 'end_train_phase' : end_train_phase, 'end_fom_phase' : end_fom_phase}
        bglasdi_results['physics'] = self.physics.export()

        date = time.localtime()
        date_str = "{month:02d}_{day:02d}_{year:04d}_{hour:02d}_{minute:02d}"
        date_str = date_str.format(month = date.tm_mon, day = date.tm_mday, year = date.tm_year, hour = date.tm_hour + 3, minute = date.tm_min)
        np.save(self.path_results + 'bglasdi_' + date_str + '.npy', bglasdi_results)
        np.save(self.path_results + '/' + 'bglasdi_' + date_str + '.npy', bglasdi_results)

        next_step, result = None, Result.Complete
        return result, next_step

    def sample_fom(self):

        # TODO(kevin): generalize this physics part.
        from .physics.burgers1d import solver

        # TODO(kevin): generalize the parameter class.
        new_a, new_b = self.new_param[0], self.new_param[1]
        # TODO(kevin): generalize this physics part.
        u0 = self.initial_condition(new_a, new_b, self.x_grid)

        maxk = 10
        convergence_threshold = 1e-8
        new_X = solver(u0, maxk, convergence_threshold, self.time_dim - 1, self.space_dim, self.Dt, self.Dx)
        new_X = new_X.reshape(1, self.time_dim, self.space_dim)
        new_X = torch.Tensor(new_X)

        self.X_train = torch.cat([self.X_train, new_X], dim = 0)
        self.param_train = np.vstack((self.param_train, np.array([[new_a, new_b]])))
        self.n_train += 1

        if not self.physics.offline:
            new_X = self.physics.solve(self.new_param)

            self.X_train = torch.cat([self.X_train, new_X], dim = 0)
            self.param_train = np.vstack((self.param_train, np.array([[new_a, new_b]])))
            self.n_train += 1
        else:
            # TODO(kevin): interface for offline FOM simulation
            raise RuntimeError("Offline FOM simulation is not supported yet!")
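Taken together, the call sites above (`physics.dt`, `physics.nt`, `physics.t_grid`, `physics.offline`, `physics.solve`, `physics.export`) imply a small interface for the new physics class. A minimal sketch, assuming a uniform time grid; the actual base class introduced by this commit lives under `src/lasdi/physics` and may differ:

```python
import numpy as np

class Physics:
    # When offline is True, sample_fom() raises instead of calling solve();
    # the offline-FOM interface is still a TODO in this commit.
    offline = False

    def __init__(self, nt, tmax, x_grid):
        self.nt = nt                             # number of time steps (was time_dim)
        self.dt = tmax / (nt - 1)                # uniform time-step size (was Dt)
        self.t_grid = np.linspace(0., tmax, nt)  # used to integrate the latent SINDy models
        self.x_grid = x_grid                     # spatial grid; shape depends on the equation

    def initial_condition(self, param):
        # Full-order initial state for one parameter point; encoded by the
        # autoencoder in initial_condition_latent().
        raise NotImplementedError

    def solve(self, param):
        # Full-order solve for one parameter point. sample_fom() concatenates
        # the result onto X_train, so it should return a torch.Tensor of
        # shape (1, nt, space_dim).
        raise NotImplementedError

    def export(self):
        # Grid and discretization metadata stored under bglasdi_results['physics'].
        return {'nt': self.nt, 'dt': self.dt, 't_grid': self.t_grid, 'x_grid': self.x_grid}
```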
src/lasdi/inputs.py (66 additions, 0 deletions)
@@ -0,0 +1,66 @@
from warnings import warn

verbose = False

class InputParser:
    dict_ = None
    name = ""

    def __init__(self, dict, name = ""):
        from copy import deepcopy
        self.dict_ = deepcopy(dict)
        self.name = name
        return

    def getInput(self, keys, fallback=None, datatype=None):
        '''
        Find the value corresponding to the list of keys.
        If the specified keys do not exist, use the fallback value.
        If the fallback value does not exist, returns an error.
        If the datatype is specified, enforce the output value has the right datatype.
        '''
        keyString = ""
        for key_ in keys:
            keyString += key_ + "/"

        val = self.dict_
        for key in keys:
            if key in val:
                val = val[key]
            elif (fallback != None):
                return fallback
            else:
                raise RuntimeError("%s does not exist in the input dictionary %s!" % (keyString, self.name))

        if (fallback != None):
            if (type(val) != type(fallback)):
                raise RuntimeError("%s does not match the type with the fallback value %s!" % (str(type(val)), str(type(fallback))))
        elif (datatype != None):
            if (type(val) != datatype):
                raise RuntimeError("%s does not match the specified datatype %s!" % (str(type(val)), str(datatype)))
        else:
            if verbose: warn("InputParser Warning: datatype is not checked.\n key: %s\n value type: %s" % (keys, type(val)))
        return val

def getDictFromList(list_, inputDict):
    '''
    get a dict with {key: val} from a list of dicts
    NOTE: it returns only the first item in the list,
    even if the list has more than one dict with {key: val}.
    '''
    dict_ = None
    for item in list_:
        isDict = True
        for key, val in inputDict.items():
            if key not in item:
                isDict = False
                break
            if (item[key] != val):
                isDict = False
                break
        if (isDict):
            dict_ = item
            break
    if (dict_ == None):
        raise RuntimeError('Given list does not have a dict with {%s: %s}!' % (key, val))
    return dict_
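For illustration, here is how the new parser might be used against the restructured `examples/burgers1d.yml` shown above. Whether `gplasdi` is wired to it exactly this way is not shown in this commit, and the `maxk` key is hypothetical:

```python
import yaml
from lasdi.inputs import InputParser, getDictFromList

with open("examples/burgers1d.yml") as f:
    config = yaml.safe_load(f)

parser = InputParser(config, name="burgers1d")

# Nested lookup; the datatype is only enforced when no fallback is given.
nt = parser.getInput(['physics', 'burgers1d', 'number_of_timesteps'], datatype=int)

# A missing key (maxk is hypothetical) silently falls back, and a present
# value's type must then match the fallback's type.
maxk = parser.getInput(['physics', 'burgers1d', 'maxk'], fallback=10)

# getDictFromList returns the first dict in a list matching every key/value pair.
options = [{'type': 'burgers1d', 'order': 1}, {'type': 'heat', 'order': 2}]
burgers_opts = getDictFromList(options, {'type': 'burgers1d'})
```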
