2 years ago · 0ab0e0ce57
--- a/src/dinn.py
+++ b/src/dinn.py
@@ -1,16 +1,10 @@
 
															 import torch
														
 
															-import os
														
 
															-import imageio
														
 
															 import numpy as np
														
 
															-import matplotlib.pyplot as plt
														
 
															-from matplotlib import rcParams
														
 
															 from .dataset import PandemicDataset
														
 
															 from .problem import PandemicProblem
														
 
															 from .plotter import Plotter
														
 
															-
														
 
															-
														
 
															 class DINN:
														
 
															     class NN(torch.nn.Module):
														
 
															         def __init__(self, 
														
@@ -48,55 +42,68 @@ class DINN:
 
															             return x
														
 
															     def __init__(self,
														
 
															-                 number_groups: int,
														
 
															+                 output_size: int,
														
 
															                  data: PandemicDataset,
														
 
															                  parameter_list: list,
														
 
															                  problem: PandemicProblem,
														
 
															                  plotter: Plotter,
														
 
															+                 state_variables=[],
														
 
															                  parameter_regulator=torch.tanh,
														
 
															-                 input_size=1,
														
 
															-                 hidden_size=20,
														
 
															+                 input_size=1, 
														
 
															+                 hidden_size=20, 
														
 
															                  hidden_layers=7, 
														
 
															                  activation_layer=torch.nn.ReLU()) -> None:
														
 
															         """Desease Informed Neural Network. Uses the PandemicProblem, DINN.NN and PandemicDataset to solve Inverse Problems and find the 
														
 
															         parameters of a specific mathematical model.
														
 
															         Args:
														
 
															-            number_groups (int): The number of groups, that the population is split into.
														
 
															+            output_size (int): Number of the output nodes of the NN.
														
 
															             data (PandemicDataset): Data collected showing the course of the pandemic
														
 
															             parameter_list (list): List of the parameter names(strings), that are supposed to be found.
														
 
															             problem (PandemicProblem): Problem class implementing the calculation of the residuals.
														
 
															             plotter (Plotter): Plotter object to plot dataset curves.
														
 
															+            state_variables (list, optional): List of the names of state variables. Defaults to [].
														
 
															             parameter_regulator (optional): Function to force the parameters to be in a certain range. Defaults to torch.tanh.
														
 
															             input_size (int, optional): Number of the input nodes of the NN. Defaults to 1.
														
 
															             hidden_size (int, optional): Number of the hidden nodes of the NN. Defaults to 20.
														
 
															             hidden_layers (int, optional): Number of the hidden layers for the NN. Defaults to 7.
														
 
															             activation_layer (optional): Class of the activation function. Defaults to torch.nn.ReLU().
														
 
															         """
														
 
															-        
														
 
															+        assert len(state_variables) + data.number_groups == output_size, f'The number of groups plus the number of state variable must result in the output size\nGroups:\t{data.number_groups}\nState variables:\t{len(state_variables)}\noutput_size: {output_size}\n'
														
 
															         self.device = torch.device(data.device_name)
														
 
															         self.device_name = data.device_name
														
 
															         self.plotter = plotter
														
 
															-        self.model = DINN.NN(number_groups, input_size, hidden_size, hidden_layers, activation_layer, data.t_init, data.t_final)
														
 
															+        self.model = DINN.NN(output_size, 
														
 
															+                             input_size, 
														
 
															+                             hidden_size, 
														
 
															+                             hidden_layers, 
														
 
															+                             activation_layer, 
														
 
															+                             data.t_init, 
														
 
															+                             data.t_final)
														
 
															         self.model = self.model.to(self.device)
														
 
															         self.data = data
														
 
															         self.parameter_regulator = parameter_regulator
														
 
															         self.problem = problem
														
 
															+        self.problem.def_grad_matrix(output_size)
														
 
															         self.parameters_tilda = {}
														
 
															         for parameter in parameter_list:
														
 
															             self.parameters_tilda.update({parameter : torch.nn.Parameter(torch.rand(1, requires_grad=True, device=self.device_name))})
														
 
															-        
														
 
															-        self.epochs = None
														
 
															-        self.losses = np.zeros(1)
														
 
															-        self.obs_losses = np.zeros(1)
														
 
															-        self.physics_losses = np.zeros(1)
														
 
															+        # new model has to be configured and then trained
														
 
															+        self.__is_configured = False
														
 
															+        self.__has_trained = False
														
 
															+
														
 
															+        self.__state_variables = state_variables
														
 
															+
														
 
															         self.parameters = [np.zeros(1) for _ in range(len(parameter_list))]
														
 
															         self.frames = []
														
 
															+    @property
														
 
															+    def number_state_variables(self):
														
 
															+        return len(self.__state_variables)
														
 
															     def get_regulated_param(self, parameter_name: str):
														
 
															         """Function to get the searched parameters, forced into a certain range.
														
@@ -125,40 +132,77 @@ class DINN:
 
															         """
														
 
															         return [self.parameter_regulator(parameter) for parameter in self.get_parameters_tilda()]
														
 
															+    def configure_training(self, lr:float, epochs:int, optimizer_name='Adam', scheduler_name='CyclicLR', scheduler_factor = 1, verbose=False):
														
 
															+        """This method sets the optimizer, scheduler, learning rate and number of epochs for the following training process.
														
 
															+
														
 
															+        Args:
														
 
															+            lr (float): Learning rate for the optimizer.
														
 
															+            epochs (int): Number of epochs the NN is supposed to be trained for.
														
 
															+            optimizer_name (str, optional): Name of the optimizer class that is supposed to be used. Defaults to 'Adam'.
														
 
															+            scheduler_name (str, optional): Name of the scheduler class that is supposed to be used. Defaults to 'CyclicLR'.
														
 
															+            verbose (bool, optional): Controles if the configuration process, is to be verbosed. Defaults to False.
														
 
															+        """
														
 
															+        parameter_list = list(self.model.parameters()) + list(self.parameters_tilda.values())
														
 
															+        self.epochs = epochs
														
 
															+        match optimizer_name:
														
 
															+            case 'Adam':
														
 
															+                self.optimizer = torch.optim.Adam(parameter_list, lr=lr)
														
 
															+            case _:
														
 
															+                self.optimizer = torch.optim.Adam(parameter_list, lr=lr)
														
 
															+                if verbose:
														
 
															+                    print('---------------------------------')
														
 
															+                    print(f' Entered unknown optimizer name: {optimizer_name}\n Defaulted to Adam.')
														
 
															+                    print('---------------------------------')
														
 
															+                optimizer_name = 'Adam'
														
 
															+
														
 
															+        match scheduler_name:
														
 
															+            case 'CyclicLR':
														
 
															+                self.scheduler = torch.optim.lr_scheduler.CyclicLR(self.optimizer, base_lr=lr * 10, max_lr=lr * 1e3, step_size_up=1000, mode="exp_range", gamma=0.85, cycle_momentum=False)
														
 
															+            case 'LinearLR':
														
 
															+                self.scheduler = torch.optim.lr_scheduler.LinearLR(self.optimizer, start_factor=lr, total_iters=epochs/scheduler_factor)
														
 
															+            case 'PolynomialLR':
														
 
															+                self.scheduler = torch.optim.lr_scheduler.PolynomialLR(self.optimizer, total_iters=epochs/scheduler_factor, power=1.0)
														
 
															+            case _:
														
 
															+                self.scheduler = torch.optim.lr_scheduler.CyclicLR(self.optimizer, base_lr=lr * 10, max_lr=lr * 1e3, step_size_up=1000, mode="exp_range", gamma=0.85, cycle_momentum=False)
														
 
															+                if verbose:
														
 
															+                    print('---------------------------------')
														
 
															+                    print(f' Entered unknown scheduler name: {scheduler_name}\n Defaulted to CyclicLR.')
														
 
															+                    print('---------------------------------')
														
 
															+                scheduler_name = 'CyclicLR'
														
 
															+
														
 
															+        if verbose:
														
 
															+            print(f'\nLearning Rate:\t{lr}\nOptimizer:\t{optimizer_name}\nScheduler:\t{scheduler_name}\n')
														
 
															+
														
 
															+        self.__is_configured = True
														
 
															+
														
 
															+    
														
 
															     def train(self, 
														
 
															-              epochs: int, 
														
 
															-              lr: float, 
														
 
															-              optimizer_class=torch.optim.Adam,
														
 
															               create_animation=False,
														
 
															-              animation_sample_rate=500):
														
 
															-        """Training routine for the DINN
														
 
															+              animation_sample_rate=500,
														
 
															+              verbose=False):
														
 
															+        """Training routine for the DINN.
														
 
															         Args:
														
 
															-            epochs (int): Number of epochs the NN is supposed to be trained for.
														
 
															-            lr (float): Learning rate for the optimizer.
														
 
															-            optimizer_class (optional): Class of the optimizer. Defaults to torch.optim.Adam.
														
 
															             create_animation (boolean, optional): Decides on wether a prediction animation is supposed to be created during training. Defaults to False.
														
 
															             animation_sample_rate (int, optional): Sample rate of the prediction animation. Only used, when create_animation=True. Defaults to 500.
														
 
															+            verbose (bool, optional): Controles if the training process, is to be verbosed. Defaults to False.
														
 
															         """
														
 
															-
														
 
															-        # define optimizer and scheduler
														
 
															-        optimizer = optimizer_class(list(self.model.parameters()) + list(self.parameters_tilda.values()), lr=lr)
														
 
															-        scheduler = torch.optim.lr_scheduler.CyclicLR(optimizer, base_lr=1e-5, max_lr=1e-3, step_size_up=1000, mode="exp_range", gamma=0.85, cycle_momentum=False)
														
 
															-
														
 
															-        self.epochs = epochs
														
 
															-
														
 
															+        assert self.__is_configured, 'The model has to be configured before training through the use of self.configure training.'
														
 
															+        if verbose:
														
 
															+            print(f'torch seed: {torch.seed()}')
														
 
															+        
														
 
															         # arrays to hold values for plotting
														
 
															-        self.losses = np.zeros(epochs)
														
 
															-        self.obs_losses = np.zeros(epochs)
														
 
															-        self.physics_losses = np.zeros(epochs)
														
 
															-        self.parameters = [np.zeros(epochs) for _ in self.parameters]
														
 
															+        self.losses = np.zeros(self.epochs)
														
 
															+        self.obs_losses = np.zeros(self.epochs)
														
 
															+        self.physics_losses = np.zeros(self.epochs)
														
 
															+        self.parameters = [np.zeros(self.epochs) for _ in self.parameters]
														
 
															-        for epoch in range(epochs):
														
 
															+        for epoch in range(self.epochs):
														
 
															             # get the prediction and the fitting residuals
														
 
															             prediction = self.model(self.data.t_batch)
														
 
															             residuals = self.problem.residual(prediction, *self.get_regulated_param_list())
														
 
															-            optimizer.zero_grad()
														
 
															+            self.optimizer.zero_grad()
														
 
															             # calculate loss from the differential system
														
 
															             loss_physics = 0
														
@@ -170,11 +214,11 @@ class DINN:
 
															             for i, group in enumerate(self.data.group_names):
														
 
															                 loss_obs += torch.mean(torch.square(self.data.get_norm(group) - prediction[:, i]))
														
 
															-            loss = loss_physics + loss_obs
														
 
															+            loss = loss_obs + loss_physics
														
 
															             loss.backward()
														
 
															-            optimizer.step()
														
 
															-            scheduler.step()
														
 
															+            self.optimizer.step()
														
 
															+            self.scheduler.step()
														
 
															             # append values for plotting
														
 
															             self.losses[epoch] = loss.item()
														
@@ -188,15 +232,18 @@ class DINN:
 
															                 # prediction
														
 
															                 prediction = self.model(self.data.t_batch)
														
 
															                 t = torch.arange(0, self.data.t_raw[-1].item(), (self.data.t_raw[-1] / self.data.t_raw.shape[0]).item())
														
 
															-                groups = self.data.get_denormalized_data([prediction[:, 0], prediction[:, 1], prediction[:, 2]])
														
 
															+                groups = self.data.get_denormalized_data([prediction[:, i] for i in range(self.data.number_groups)])
														
 
															+
														
 
															+                plot_labels = [name + '_pred' for name in self.data.group_names] + [name + '_true' for name in self.data.group_names]
														
 
															+                background_list = [0 for _ in self.data.group_names] + [1 for _ in self.data.group_names]
														
 
															                 self.plotter.plot(t, 
														
 
															                                   list(groups) + list(self.data.data), 
														
 
															-                                  [name + '_pred' for name in self.data.group_names] + [name + '_true' for name in self.data.group_names],
														
 
															+                                  plot_labels,
														
 
															                                   'frame',
														
 
															                                   f'epoch {epoch}',
														
 
															                                   figure_shape=(12, 6),
														
 
															                                   is_frame=True,
														
 
															-                                  is_background=[0, 0, 0, 1, 1, 1],
														
 
															+                                  is_background=background_list,
														
 
															                                   lw=3,
														
 
															                                   legend_loc='upper right',
														
 
															                                   ylim=(0, self.data.N), 
														
@@ -204,19 +251,23 @@ class DINN:
 
															                                   ylabel='amount of people')
														
 
															             # print training advancements
														
 
															-            if epoch % 1000 == 0:          
														
 
															-                print('\nEpoch ', epoch)
														
 
															+            if epoch % 1000 == 0 and verbose:          
														
 
															+                print(f'\nEpoch {epoch} | LR {self.scheduler.get_last_lr()[0]}')
														
 
															                 print(f'physics loss:\t\t{loss_physics.item()}')
														
 
															                 print(f'observation loss:\t{loss_obs.item()}')
														
 
															                 print(f'loss:\t\t\t{loss.item()}')
														
 
															                 print('---------------------------------')
														
 
															-                for parameter in self.parameters_tilda.items():
														
 
															-                    print(f'{parameter[0]}:\t\t\t{self.parameter_regulator(parameter[1]).item()}')
														
 
															-                print('#################################')
														
 
															+                if len(self.parameters_tilda.items()) != 0:
														
 
															+                    for parameter in self.parameters_tilda.items():
														
 
															+                        print(f'{parameter[0]}:\t\t\t{self.parameter_regulator(parameter[1]).item()}')
														
 
															+                    print('#################################')
														
 
															         # create prediction animation
														
 
															         if create_animation:
														
 
															             self.plotter.animate(self.data.name + '_animation')
														
 
															+            self.plotter.reset_animation()
														
 
															+
														
 
															+        self.__has_trained = True
														
 
															     def plot_training_graphs(self, ground_truth=[]):
														
 
															         """Plot the loss graph and the graphs of the advancements of the parameters.
														
@@ -224,7 +275,7 @@ class DINN:
 
															         Args:
														
 
															             ground_truth (list): List of the ground truth parameters
														
 
															         """
														
 
															-        assert self.epochs != None
														
 
															+        assert self.__has_trained, 'Model has to be trained, before plotting the training graphs'
														
 
															         epochs = np.arange(0, self.epochs, 1)
														
 
															         # plot loss
														
@@ -233,8 +284,34 @@ class DINN:
 
															         # plot parameters
														
 
															         for i, parameter in enumerate(self.parameters):
														
 
															             if len(ground_truth) > i:
														
 
															-                self.plotter.plot(epochs, [parameter, np.ones_like(epochs) * ground_truth[i]], ['prediction', 'ground truth'], self.data.name + '_' + list(self.parameters_tilda.items())[i][0], list(self.parameters_tilda.items())[i][0], (6,6), is_background=[0, 1], xlabel='epochs')
														
 
															+                self.plotter.plot(epochs, 
														
 
															+                                  [parameter, 
														
 
															+                                   np.ones_like(epochs) * ground_truth[i]], 
														
 
															+                                   ['prediction', 'ground truth'], 
														
 
															+                                   self.data.name + '_' + list(self.parameters_tilda.items())[i][0], 
														
 
															+                                   list(self.parameters_tilda.items())[i][0], (6,6), 
														
 
															+                                   is_background=[0, 1], 
														
 
															+                                   xlabel='epochs')
														
 
															             else:
														
 
															-                self.plotter.plot(epochs, [parameter], ['prediction'], self.data.name + '_' + list(self.parameters_tilda.items())[i][0], list(self.parameters_tilda.items())[i][0], (6,6), xlabel='epochs', plot_legend=False)
														
 
															-
														
 
															-        
														
 
															+                self.plotter.plot(epochs, 
														
 
															+                                  [parameter], 
														
 
															+                                  ['prediction'], 
														
 
															+                                  self.data.name + '_' + list(self.parameters_tilda.items())[i][0], 
														
 
															+                                  list(self.parameters_tilda.items())[i][0], (6,6), 
														
 
															+                                  xlabel='epochs', 
														
 
															+                                  plot_legend=False)
														
 
															+
														
 
															+    def plot_state_variables(self):
														
 
															+        for i in range(self.data.number_groups, self.data.number_groups+self.number_state_variables):
														
 
															+            prediction = self.model(self.data.t_batch)
														
 
															+            groups = [prediction[:, i] for i in range(self.data.number_groups)]
														
 
															+            t = torch.arange(0, self.data.t_raw[-1].item(), (self.data.t_raw[-1] / self.data.t_raw.shape[0]).item())
														
 
															+            self.plotter.plot(t,
														
 
															+                              [prediction[:, i]] + groups,
														
 
															+                              [self.__state_variables[i-self.data.number_groups]] + self.data.group_names,
														
 
															+                              f'{self.data.name}_{self.__state_variables[i-self.data.number_groups]}',
														
 
															+                              self.__state_variables[i-self.data.number_groups],
														
 
															+                              is_background=[0, 1, 1],
														
 
															+                              figure_shape=(12, 6),
														
 
															+                              plot_legend=True,
														
 
															+                              xlabel='time / days')
														
--- a/src/problem.py
+++ b/src/problem.py
@@ -9,41 +9,73 @@ class PandemicProblem:
 
															             data (PandemicDataset): Dataset holding the time values used.
														
 
															         """
														
 
															-        self.data = data
														
 
															-        self.device_name = data.device_name
														
 
															+        self._data = data
														
 
															+        self._device_name = data.device_name
														
 
															-        #store the gradients for each group
														
 
															-        self.gradients = [torch.zeros((len(data.t_raw), data.number_groups), device=self.device_name) for _ in range(data.number_groups)]
														
 
															-
														
 
															-        for i in range(data.number_groups):
														
 
															-            self.gradients[i][:, i] = 1
														
 
															+        self._gradients = None
														
 
															     def residual(self):
														
 
															         """NEEDS TO BE IMPLEMENTED WHEN INHERITING FROM THIS CLASS
														
 
															         """
														
 
															-        pass
														
 
															+        assert self._gradients != None, 'Gradientmatrix need to be defined'
														
 
															+        
														
 
															+
														
 
															+    def def_grad_matrix(self, number:int):
														
 
															+        assert self._gradients == None, 'Gradientmatrix is already defined'
														
 
															+        self._gradients = [torch.zeros((len(self._data.t_raw), number), device=self._device_name) for _ in range(number)]
														
 
															+        for i in range(number):
														
 
															+            self._gradients[i][:, i] = 1
														
 
															 class SIRProblem(PandemicProblem):
														
 
															     def __init__(self, data: PandemicDataset):
														
 
															         super().__init__(data)
														
 
															     def residual(self, SIR_pred, alpha, beta):
														
 
															-        SIR_pred.backward(self.gradients[0], retain_graph=True)
														
 
															-        dSdt = self.data.t_raw.grad.clone()
														
 
															-        self.data.t_raw.grad.zero_()
														
 
															+        super().residual()
														
 
															+        SIR_pred.backward(self._gradients[0], retain_graph=True)
														
 
															+        dSdt = self._data.t_raw.grad.clone()
														
 
															+        self._data.t_raw.grad.zero_()
														
 
															-        SIR_pred.backward(self.gradients[1], retain_graph=True)
														
 
															-        dIdt = self.data.t_raw.grad.clone()
														
 
															-        self.data.t_raw.grad.zero_()
														
 
															+        SIR_pred.backward(self._gradients[1], retain_graph=True)
														
 
															+        dIdt = self._data.t_raw.grad.clone()
														
 
															+        self._data.t_raw.grad.zero_()
														
 
															-        SIR_pred.backward(self.gradients[2], retain_graph=True)
														
 
															-        dRdt = self.data.t_raw.grad.clone()
														
 
															-        self.data.t_raw.grad.zero_()
														
 
															+        SIR_pred.backward(self._gradients[2], retain_graph=True)
														
 
															+        dRdt = self._data.t_raw.grad.clone()
														
 
															+        self._data.t_raw.grad.zero_()
														
 
															-        S, I, R = self.data.get_denormalized_data([SIR_pred[:, 0], SIR_pred[:, 1], SIR_pred[:, 2]])
														
 
															+        S, I, _ = self._data.get_denormalized_data([SIR_pred[:, 0], SIR_pred[:, 1], SIR_pred[:, 2]])
														
 
															-        S_residual = dSdt - (-beta * ((S * I) / self.data.N)) / (self.data.get_max('S') - self.data.get_min('S'))
														
 
															-        I_residual = dIdt - (beta * ((S * I) / self.data.N) - alpha * I) / (self.data.get_max('I') - self.data.get_min('I'))
														
 
															-        R_residual = dRdt - (alpha * I) / (self.data.get_max('R') - self.data.get_min('R'))
														
 
															+        S_residual = dSdt - (-beta * ((S * I) / self._data.N)) / (self._data.get_max('S') - self._data.get_min('S'))
														
 
															+        I_residual = dIdt - (beta * ((S * I) / self._data.N) - alpha * I) / (self._data.get_max('I') - self._data.get_min('I'))
														
 
															+        R_residual = dRdt - (alpha * I) / (self._data.get_max('R') - self._data.get_min('R'))
														
 
															         return S_residual, I_residual, R_residual
														
 
															+
														
 
															+
														
 
															+class ReducedSIRProblem(PandemicProblem):
														
 
															+    def __init__(self, data: PandemicDataset, alpha:float):
														
 
															+        super().__init__(data)
														
 
															+        self.alpha = alpha
														
 
															+
														
 
															+    def residual(self, SI_pred):
														
 
															+        super().residual()
														
 
															+        SI_pred.backward(self._gradients[0], retain_graph=True)
														
 
															+        dSdt = self._data.t_raw.grad.clone()
														
 
															+        self._data.t_raw.grad.zero_()
														
 
															+
														
 
															+        SI_pred.backward(self._gradients[1], retain_graph=True)
														
 
															+        dIdt = self._data.t_raw.grad.clone()
														
 
															+        self._data.t_raw.grad.zero_()
														
 
															+
														
 
															+        _, I = self._data.get_denormalized_data([SI_pred[:, 0], SI_pred[:, 1]])
														
 
															+        R_t = SI_pred[:, 2]
														
 
															+        # I = SI_pred[:, 1]
														
 
															+
														
 
															+        S_residual = dSdt - (-self.alpha * R_t * I)
														
 
															+        I_residual = dIdt - (self.alpha * (R_t - 1) * I)
														
 
															+
														
 
															+        # print(f'\nTrue:\tI_min: {I.min()}, I_max: {I.max()}\nNorm:\tI_min: {SI_pred[:, 1].min()}, I_max: {SI_pred[:, 1].max()}\nResidual:\t{torch.mean(torch.square(I_residual))}')
														
 
															+
														
 
															+        return S_residual, I_residual
														
 
															+