From 049e1000323982ded2f48afcca452283f3b8caa9 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 12:03:11 +0100 Subject: [PATCH 01/21] Started overhauling the docstrings --- mala/common/parallelizer.py | 13 ++++--- mala/common/physical_data.py | 66 ++++++++++++++++++++++++++++++++++-- 2 files changed, 71 insertions(+), 8 deletions(-) diff --git a/mala/common/parallelizer.py b/mala/common/parallelizer.py index 160695a42..e59b8a984 100644 --- a/mala/common/parallelizer.py +++ b/mala/common/parallelizer.py @@ -5,7 +5,6 @@ import os import warnings -import torch import torch.distributed as dist use_ddp = False @@ -154,6 +153,11 @@ def get_local_rank(): LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. + + Returns + ------- + local_rank : int + The local rank of the current thread. """ if use_ddp: return int(os.environ.get("LOCAL_RANK")) @@ -189,7 +193,6 @@ def get_size(): return comm.Get_size() -# TODO: This is hacky, improve it. def get_comm(): """ Return the MPI communicator, if MPI is being used. @@ -197,7 +200,7 @@ def get_comm(): Returns ------- comm : MPI.COMM_WORLD - A MPI communicator. + An MPI communicator. """ return comm @@ -221,7 +224,7 @@ def printout(*values, sep=" ", min_verbosity=0): Parameters ---------- - values + values : object Values to be printed. sep : string @@ -245,7 +248,7 @@ def parallel_warn(warning, min_verbosity=0, category=UserWarning): Parameters ---------- - warning + warning : str Warning to be printed. min_verbosity : int Minimum number of verbosity for this output to still be printed. diff --git a/mala/common/physical_data.py b/mala/common/physical_data.py index 629378829..3b333a0a6 100644 --- a/mala/common/physical_data.py +++ b/mala/common/physical_data.py @@ -12,10 +12,27 @@ class PhysicalData(ABC): """ - Base class for physical data. + Base class for volumetric physical data. Implements general framework to read and write such data to and from - files. + files. Volumetric data is assumed to exist on a 3D grid. As such it + either has the dimensions [x,y,z,f], where f is the feature dimension. + All loading functions within this class assume such a 4D array. Within + MALA, occasionally 2D arrays of dimension [x*y*z,f] are used and reshaped + accordingly. + + Parameters + ---------- + parameters : mala.Parameters + MALA Parameters object used to create this class. + + Attributes + ---------- + parameters : mala.Parameters + Internal copy of the MALA parameters object + + grid_dimensions : list + List of the grid dimensions (x,y,z) """ ############################## @@ -86,6 +103,9 @@ def read_from_numpy_file( If not None, the array to save the data into. The array has to be 4-dimensional. + reshape : bool + If True, the loaded 4D array will be reshaped into a 2D array. + Returns ------- data : numpy.ndarray or None @@ -263,6 +283,14 @@ def read_dimensions_from_numpy_file(self, path, read_dtype=False): read_dtype : bool If True, the dtype is read alongside the dimensions. + + Returns + ------- + dimension_info : list or tuple + If read_dtype is False, then only a list containing the dimensions + of the saved array is returned. If read_dtype is True, a tuple + containing this list of dimensions and the dtype of the array will + be returned. 
""" loaded_array = np.load(path, mmap_mode="r") if read_dtype: @@ -286,6 +314,14 @@ def read_dimensions_from_openpmd_file( read_dtype : bool If True, the dtype is read alongside the dimensions. + + comm : MPI.Comm + An MPI communicator to be used for parallelized I/O + + Returns + ------- + dimension_info : list + A list containing the dimensions of the saved array. """ if comm is None or comm.rank == 0: import openpmd_api as io @@ -379,6 +415,22 @@ class SkipArrayWriting: In order to provide this data, the numpy array can be replaced with an instance of the class SkipArrayWriting. + + Parameters + ---------- + dataset : openpmd_api.Dataset + OpenPMD Data set to eventually write to. + + feature_size : int + Size of the feature dimension. + + Attributes + ---------- + dataset : mala.Parameters + Internal copy of the openPMD Data set to eventually write to. + + feature_size : list + Internal copy of the size of the feature dimension. """ # dataset has type openpmd_api.Dataset (not adding a type hint to avoid @@ -408,7 +460,7 @@ def write_to_openpmd_file( the openPMD structure. additional_attributes : dict - Dict containing additional attributes to be saved. + Dictionary containing additional attributes to be saved. internal_iteration_number : int Internal OpenPMD iteration number. Ideally, this number should @@ -489,6 +541,14 @@ def write_to_openpmd_iteration( If not None, and the selected class implements it, additional metadata will be read from this source. This metadata will then, depending on the class, be saved in the OpenPMD file. + + local_offset : int + + local_reach : int + + feature_from : int + + feature_to : int """ import openpmd_api as io From b03afcc8d94b823531700a4d325955cbe9105c4d Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 15:21:52 +0100 Subject: [PATCH 02/21] Common (except for Parameters) and DataGeneration finished --- mala/common/physical_data.py | 14 +++++-- mala/datageneration/ofdft_initializer.py | 43 ++++++++++++++++------ mala/datageneration/trajectory_analyzer.py | 13 +++++++ 3 files changed, 56 insertions(+), 14 deletions(-) diff --git a/mala/common/physical_data.py b/mala/common/physical_data.py index 3b333a0a6..19fad8637 100644 --- a/mala/common/physical_data.py +++ b/mala/common/physical_data.py @@ -29,7 +29,7 @@ class PhysicalData(ABC): Attributes ---------- parameters : mala.Parameters - Internal copy of the MALA parameters object + Internal copy of the MALA parameters object. grid_dimensions : list List of the grid dimensions (x,y,z) @@ -542,13 +542,21 @@ def write_to_openpmd_iteration( metadata will be read from this source. This metadata will then, depending on the class, be saved in the OpenPMD file. - local_offset : int + local_offset : list + [x,y,z] value from which to start writing the array. - local_reach : int + local_reach : list + [x,y,z] value until which to read the array. feature_from : int + Value from which to start writing in the feature dimension. With + this parameter and feature_to, one can parallelize over the feature + dimension. feature_to : int + Value until which to write in the feature dimension. With + this parameter and feature_from, one can parallelize over the feature + dimension. 
""" import openpmd_api as io diff --git a/mala/datageneration/ofdft_initializer.py b/mala/datageneration/ofdft_initializer.py index 2086b8dbb..0ee142f81 100644 --- a/mala/datageneration/ofdft_initializer.py +++ b/mala/datageneration/ofdft_initializer.py @@ -22,12 +22,26 @@ class OFDFTInitializer: Parameters ---------- - parameters : mala.common.parameters.Parameters - Parameters object used to create this instance. + parameters : mala.Parameters + MALA parameters object used to create this instance. atoms : ase.Atoms Initial atomic configuration for which an equilibrated configuration is to be created. + + + Attributes + ---------- + parameters : mala.Parameters + Internal copy of the MALA parameters object. + + atoms : ase.Atoms + Internal copy of the initial atomic configuration for which an + equilibrated configuration is to be created. + + dftpy_configuration : dict + Dictionary containing the DFTpy configuration. Will partially be + populated via the MALA parameters object. """ def __init__(self, parameters, atoms): @@ -37,7 +51,7 @@ def __init__(self, parameters, atoms): "large changes." ) self.atoms = atoms - self.params = parameters.datageneration + self.parameters = parameters.datageneration # Check that only one element is used in the atoms. number_of_elements = len(set([x.symbol for x in self.atoms])) @@ -47,11 +61,13 @@ def __init__(self, parameters, atoms): ) self.dftpy_configuration = DefaultOption() - self.dftpy_configuration["PATH"]["pppath"] = self.params.local_psp_path + self.dftpy_configuration["PATH"][ + "pppath" + ] = self.parameters.local_psp_path self.dftpy_configuration["PP"][ self.atoms[0].symbol - ] = self.params.local_psp_name - self.dftpy_configuration["OPT"]["method"] = self.params.ofdft_kedf + ] = self.parameters.local_psp_name + self.dftpy_configuration["OPT"]["method"] = self.parameters.ofdft_kedf self.dftpy_configuration["KEDF"]["kedf"] = "WT" self.dftpy_configuration["JOB"]["calctype"] = "Energy Force" @@ -64,6 +80,11 @@ def get_equilibrated_configuration(self, logging_period=None): logging_period : int If not None, a .log and .traj file will be filled with snapshot information every logging_period steps. + + Returns + ------- + equilibrated_configuration : ase.Atoms + Equilibrated atomic configuration. """ # Set the DFTPy configuration. conf = OptionFormat(self.dftpy_configuration) @@ -75,14 +96,14 @@ def get_equilibrated_configuration(self, logging_period=None): # Create the initial velocities, and dynamics object. MaxwellBoltzmannDistribution( self.atoms, - temperature_K=self.params.ofdft_temperature, + temperature_K=self.parameters.ofdft_temperature, force_temp=True, ) dyn = Langevin( self.atoms, - self.params.ofdft_timestep * units.fs, - temperature_K=self.params.ofdft_temperature, - friction=self.params.ofdft_friction, + self.parameters.ofdft_timestep * units.fs, + temperature_K=self.parameters.ofdft_temperature, + friction=self.parameters.ofdft_friction, ) # If logging is desired, do the logging. @@ -105,5 +126,5 @@ def get_equilibrated_configuration(self, logging_period=None): # Let the OF-DFT-MD run. 
ase.io.write("POSCAR_initial", self.atoms, "vasp") - dyn.run(self.params.ofdft_number_of_timesteps) + dyn.run(self.parameters.ofdft_number_of_timesteps) ase.io.write("POSCAR_equilibrated", self.atoms, "vasp") diff --git a/mala/datageneration/trajectory_analyzer.py b/mala/datageneration/trajectory_analyzer.py index 4de1a8d1d..ca34cd1db 100644 --- a/mala/datageneration/trajectory_analyzer.py +++ b/mala/datageneration/trajectory_analyzer.py @@ -29,6 +29,19 @@ class TrajectoryAnalyzer: target_calculator : mala.targets.target.Target A target calculator to calculate e.g. the RDF. If None is provided, one will be generated ad-hoc (recommended). + + temperatures : string or numpy.ndarray + Array holding the temperatures for the trajectory or path to numpy + file containing temperatures. + + target_temperature : float + Target temperature for equilibration. + + malada_compatability : bool + If True, twice the radius set by the minimum imaging convention (MIC) + will be used for RDF calculation. This is generally discouraged, + but some older malada calculations have been performed with it, so + this parameter provides reproducibility. """ def __init__( From ee158e380773a9074b1324cf915e89297405723f Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 15:35:26 +0100 Subject: [PATCH 03/21] Some DataGeneration stuff was wrong --- mala/common/physical_data.py | 6 +- mala/datageneration/ofdft_initializer.py | 6 +- mala/datageneration/trajectory_analyzer.py | 71 ++++++++++++++++------ mala/datahandling/data_converter.py | 51 ++++++++-------- 4 files changed, 82 insertions(+), 52 deletions(-) diff --git a/mala/common/physical_data.py b/mala/common/physical_data.py index 19fad8637..c7dd08f40 100644 --- a/mala/common/physical_data.py +++ b/mala/common/physical_data.py @@ -29,7 +29,7 @@ class PhysicalData(ABC): Attributes ---------- parameters : mala.Parameters - Internal copy of the MALA parameters object. + MALA parameters object. grid_dimensions : list List of the grid dimensions (x,y,z) @@ -427,10 +427,10 @@ class SkipArrayWriting: Attributes ---------- dataset : mala.Parameters - Internal copy of the openPMD Data set to eventually write to. + OpenPMD Data set to eventually write to. feature_size : list - Internal copy of the size of the feature dimension. + Size of the feature dimension. """ # dataset has type openpmd_api.Dataset (not adding a type hint to avoid diff --git a/mala/datageneration/ofdft_initializer.py b/mala/datageneration/ofdft_initializer.py index 0ee142f81..0f932f8c5 100644 --- a/mala/datageneration/ofdft_initializer.py +++ b/mala/datageneration/ofdft_initializer.py @@ -32,11 +32,11 @@ class OFDFTInitializer: Attributes ---------- - parameters : mala.Parameters - Internal copy of the MALA parameters object. + parameters : mala.mala.common.parameters.ParametersDataGeneration + MALA data generation parameters object. atoms : ase.Atoms - Internal copy of the initial atomic configuration for which an + Initial atomic configuration for which an equilibrated configuration is to be created. dftpy_configuration : dict diff --git a/mala/datageneration/trajectory_analyzer.py b/mala/datageneration/trajectory_analyzer.py index ca34cd1db..09da64ebe 100644 --- a/mala/datageneration/trajectory_analyzer.py +++ b/mala/datageneration/trajectory_analyzer.py @@ -42,6 +42,34 @@ class TrajectoryAnalyzer: will be used for RDF calculation. This is generally discouraged, but some older malada calculations have been performed with it, so this parameter provides reproducibility. 
+ + Attributes + ---------- + parameters : mala.common.parameters.ParametersDataGeneration + MALA data generation parameters. + + average_distance_equilibrated : float + Distance threshold for determination of first equilibrated snapshot. + + distance_metrics_denoised : numpy.ndarray + RDF based distance metrics used for equilibration analysis. + + distances_realspace : numpy.ndarray + Realspace distance metrics used to sample snapshots. + + first_considered_snapshot : int + First snapshot to be considered during equilibration analysis (i.e., + after pruning). + + first_snapshot : int + First snapshot that can be considered to be equilibrated. + + last_considered_snapshot : int + Last snapshot to be considered during equilibration analysis (i.e., + after pruning). + + target_calculator : mala.targets.target.Target + Target calculator used for computing RDFs. """ def __init__( @@ -59,7 +87,7 @@ def __init__( "large changes." ) - self.params: ParametersDataGeneration = parameters.datageneration + self.parameters: ParametersDataGeneration = parameters.datageneration # If needed, read the trajectory self.trajectory = None @@ -71,12 +99,12 @@ def __init__( raise Exception("Incompatible trajectory format provided.") # If needed, read the temperature files - self.temperatures = None + self._temperatures = None if temperatures is not None: if isinstance(temperatures, np.ndarray): - self.temperatures = temperatures + self._temperatures = temperatures elif isinstance(temperatures, str): - self.temperatures = np.load(temperatures) + self._temperatures = np.load(temperatures) else: raise Exception("Incompatible temperature format provided.") @@ -89,7 +117,7 @@ def __init__( self.target_calculator.temperature = target_temperature # Initialize variables. - self.distance_metrics = [] + self._distance_metrics = [] self.distance_metrics_denoised = [] self.average_distance_equilibrated = None self.__saved_rdf = None @@ -163,11 +191,11 @@ def get_first_snapshot( # First, we ned to calculate the reduced metrics for the trajectory. # For this, we calculate the distance between all the snapshots # and the last one. - self.distance_metrics = [] + self._distance_metrics = [] if equilibrated_snapshot is None: equilibrated_snapshot = self.trajectory[-1] for idx, step in enumerate(self.trajectory): - self.distance_metrics.append( + self._distance_metrics.append( self._calculate_distance_between_snapshots( equilibrated_snapshot, step, @@ -178,16 +206,16 @@ def get_first_snapshot( ) # Now, we denoise the distance metrics. - self.distance_metrics_denoised = self.__denoise(self.distance_metrics) + self.distance_metrics_denoised = self.__denoise(self._distance_metrics) # Which snapshots are considered depends on how we denoise the # distance metrics. 
self.first_considered_snapshot = ( - self.params.trajectory_analysis_denoising_width + self.parameters.trajectory_analysis_denoising_width ) self.last_considered_snapshot = ( np.shape(self.distance_metrics_denoised)[0] - - self.params.trajectory_analysis_denoising_width + - self.parameters.trajectory_analysis_denoising_width ) considered_length = ( self.last_considered_snapshot - self.first_considered_snapshot @@ -202,7 +230,7 @@ def get_first_snapshot( self.distance_metrics_denoised[ considered_length - int( - self.params.trajectory_analysis_estimated_equilibrium + self.parameters.trajectory_analysis_estimated_equilibrium * considered_length ) : self.last_considered_snapshot ] @@ -225,7 +253,7 @@ def get_first_snapshot( is_below = False if ( counter - == self.params.trajectory_analysis_below_average_counter + == self.parameters.trajectory_analysis_below_average_counter ): first_snapshot = idx break @@ -255,10 +283,12 @@ def get_snapshot_correlation_cutoff(self): to each other to a degree that suggests temporal neighborhood. """ - if self.params.trajectory_analysis_correlation_metric_cutoff < 0: + if self.parameters.trajectory_analysis_correlation_metric_cutoff < 0: return self._analyze_distance_metric(self.trajectory) else: - return self.params.trajectory_analysis_correlation_metric_cutoff + return ( + self.parameters.trajectory_analysis_correlation_metric_cutoff + ) def get_uncorrelated_snapshots(self, filename_uncorrelated_snapshots): """ @@ -278,7 +308,8 @@ def get_uncorrelated_snapshots(self, filename_uncorrelated_snapshots): filename_uncorrelated_snapshots ).split(".")[0] allowed_temp_diff_K = ( - self.params.trajectory_analysis_temperature_tolerance_percent / 100 + self.parameters.trajectory_analysis_temperature_tolerance_percent + / 100 ) * self.target_calculator.temperature current_snapshot = self.first_snapshot begin_snapshot = self.first_snapshot + 1 @@ -288,9 +319,9 @@ def get_uncorrelated_snapshots(self, filename_uncorrelated_snapshots): for i in range(begin_snapshot, end_snapshot): if self.__check_if_snapshot_is_valid( self.trajectory[i], - self.temperatures[i], + self._temperatures[i], self.trajectory[current_snapshot], - self.temperatures[current_snapshot], + self._temperatures[current_snapshot], self.snapshot_correlation_cutoff, allowed_temp_diff_K, ): @@ -329,7 +360,7 @@ def _analyze_distance_metric(self, trajectory): + self.first_snapshot ) width = int( - self.params.trajectory_analysis_estimated_equilibrium + self.parameters.trajectory_analysis_estimated_equilibrium * np.shape(self.distance_metrics_denoised)[0] ) self.distances_realspace = [] @@ -416,8 +447,8 @@ def _calculate_distance_between_snapshots( def __denoise(self, signal): denoised_signal = np.convolve( signal, - np.ones(self.params.trajectory_analysis_denoising_width) - / self.params.trajectory_analysis_denoising_width, + np.ones(self.parameters.trajectory_analysis_denoising_width) + / self.parameters.trajectory_analysis_denoising_width, mode="same", ) return denoised_signal diff --git a/mala/datahandling/data_converter.py b/mala/datahandling/data_converter.py index 5b22e2293..fa0b96df4 100644 --- a/mala/datahandling/data_converter.py +++ b/mala/datahandling/data_converter.py @@ -43,6 +43,9 @@ class DataConverter: target_calculator : mala.targets.target.Target Target calculator used for parsing/converting target data. + + parameters : mala.Parama + parameters_full """ def __init__( @@ -69,9 +72,9 @@ def __init__( self.__snapshot_units = [] # Keep track of what has to be done by this data converter. 
- self.process_descriptors = False - self.process_targets = False - self.process_additional_info = False + self.__process_descriptors = False + self.__process_targets = False + self.__process_additional_info = False def add_snapshot( self, @@ -143,7 +146,7 @@ def add_snapshot( ) if descriptor_input_type not in descriptor_input_types: raise Exception("Cannot process this type of descriptor data.") - self.process_descriptors = True + self.__process_descriptors = True if target_input_type is not None: if target_input_path is None: @@ -152,7 +155,7 @@ def add_snapshot( ) if target_input_type not in target_input_types: raise Exception("Cannot process this type of target data.") - self.process_targets = True + self.__process_targets = True if additional_info_input_type is not None: metadata_input_type = additional_info_input_type @@ -165,7 +168,7 @@ def add_snapshot( raise Exception( "Cannot process this type of additional info data." ) - self.process_additional_info = True + self.__process_additional_info = True metadata_input_path = additional_info_input_path @@ -299,19 +302,19 @@ def convert_snapshots( target_save_path = complete_save_path additional_info_save_path = complete_save_path else: - if self.process_targets is True and target_save_path is None: + if self.__process_targets is True and target_save_path is None: raise Exception( "No target path specified, cannot process data." ) if ( - self.process_descriptors is True + self.__process_descriptors is True and descriptor_save_path is None ): raise Exception( "No descriptor path specified, cannot process data." ) if ( - self.process_additional_info is True + self.__process_additional_info is True and additional_info_save_path is None ): raise Exception( @@ -323,7 +326,7 @@ def convert_snapshots( snapshot_name = naming_scheme series_name = snapshot_name.replace("*", str("%01T")) - if self.process_descriptors: + if self.__process_descriptors: if self.parameters._configuration["mpi"]: input_series = io.Series( os.path.join( @@ -351,7 +354,7 @@ def convert_snapshots( input_series.set_software(name="MALA", version="x.x.x") input_series.author = "..." - if self.process_targets: + if self.__process_targets: if self.parameters._configuration["mpi"]: output_series = io.Series( os.path.join( @@ -386,7 +389,7 @@ def convert_snapshots( snapshot_name = snapshot_name.replace("*", str(snapshot_number)) # Create the paths as needed. - if self.process_additional_info: + if self.__process_additional_info: info_path = os.path.join( additional_info_save_path, snapshot_name + ".info.json" ) @@ -397,7 +400,7 @@ def convert_snapshots( if file_ending == "npy": # Create the actual paths, if needed. - if self.process_descriptors: + if self.__process_descriptors: descriptor_path = os.path.join( descriptor_save_path, snapshot_name + ".in." + file_ending, @@ -406,7 +409,7 @@ def convert_snapshots( descriptor_path = None memmap = None - if self.process_targets: + if self.__process_targets: target_path = os.path.join( target_save_path, snapshot_name + ".out." 
+ file_ending, @@ -425,13 +428,13 @@ def convert_snapshots( descriptor_path = None target_path = None memmap = None - if self.process_descriptors: + if self.__process_descriptors: input_iteration = input_series.write_iterations()[ i + starts_at ] input_iteration.dt = i + starts_at input_iteration.time = 0 - if self.process_targets: + if self.__process_targets: output_iteration = output_series.write_iterations()[ i + starts_at ] @@ -460,9 +463,9 @@ def convert_snapshots( # Properly close series if file_ending != "npy": - if self.process_descriptors: + if self.__process_descriptors: del input_series - if self.process_targets: + if self.__process_targets: del output_series def __convert_single_snapshot( @@ -636,10 +639,8 @@ def __convert_single_snapshot( snapshot["output"], units=original_units["output"] ) elif description["output"] == "numpy": - tmp_output = ( - self.target_calculator.read_from_numpy_file( - snapshot["output"], units=original_units["output"] - ) + tmp_output = self.target_calculator.read_from_numpy_file( + snapshot["output"], units=original_units["output"] ) elif description["output"] is None: @@ -687,10 +688,8 @@ def __convert_single_snapshot( snapshot["output"], units=original_units["output"] ) elif description["output"] == "numpy": - tmp_output = ( - self.target_calculator.read_from_numpy_file( - snapshot["output"] - ) + tmp_output = self.target_calculator.read_from_numpy_file( + snapshot["output"] ) elif description["output"] is None: From 9fe2f95f9f40571c41ec41baff0711c24f6712c0 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 15:38:48 +0100 Subject: [PATCH 04/21] DataConverter --- mala/datahandling/data_converter.py | 11 ++++++----- 1 file changed, 6 insertions(+), 5 deletions(-) diff --git a/mala/datahandling/data_converter.py b/mala/datahandling/data_converter.py index fa0b96df4..21fb34cdb 100644 --- a/mala/datahandling/data_converter.py +++ b/mala/datahandling/data_converter.py @@ -44,8 +44,12 @@ class DataConverter: target_calculator : mala.targets.target.Target Target calculator used for parsing/converting target data. - parameters : mala.Parama - parameters_full + parameters : mala.common.parameters.ParametersData + MALA data handling parameters object. + + parameters_full : mala.common.parameters.Parameters + MALA parameters object. The full object is necessary for some data + handling tasks. """ def __init__( @@ -503,9 +507,6 @@ def __convert_single_snapshot( output_path : string If not None, outputs will be saved in this file. - return_data : bool - If True, inputs and outputs will be returned directly. - target_calculator_kwargs : dict Dictionary with additional keyword arguments for the calculation or parsing of the target quantities. From 0323864f2b5d1b89bf7d4add766ae35400094da2 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 15:58:02 +0100 Subject: [PATCH 05/21] Done data handler --- mala/datahandling/data_handler.py | 146 +++++++++++++++++++----------- 1 file changed, 93 insertions(+), 53 deletions(-) diff --git a/mala/datahandling/data_handler.py b/mala/datahandling/data_handler.py index 7b8fc2a43..85ec098e3 100644 --- a/mala/datahandling/data_handler.py +++ b/mala/datahandling/data_handler.py @@ -18,10 +18,10 @@ class DataHandler(DataHandlerBase): """ - Loads and scales data. Can only process numpy arrays at the moment. + Loads and scales data. Can load from numpy or OpenPMD files. - Data that is not in a numpy array can be converted using the DataConverter - class. 
+ Data that is not saved as numpy or OpenPMD file can be converted using the + DataConverter class. Parameters ---------- @@ -47,6 +47,41 @@ class DataHandler(DataHandlerBase): clear_data : bool If true (default), the data list will be cleared upon creation of the object. + + Attributes + ---------- + input_data_scaler : mala.datahandling.data_scaler.DataScaler + Used to scale the input data. + + nr_test_data : int + Number of test data points. + + nr_test_snapshots : int + Number of test snapshots. + + nr_training_data : int + Number of training data points. + + nr_training_snapshots : int + Number of training snapshots. + + nr_validation_data : int + Number of validation data points. + + nr_validation_snapshots : int + Number of validation snapshots. + + output_data_scaler : mala.datahandling.data_scaler.DataScaler + Used to scale the output data. + + test_data_sets : list + List containing torch data sets for test data. + + training_data_sets : list + List containing torch data sets for training data. + + validation_data_sets : list + List containing torch data sets for validation data. """ ############################## @@ -93,18 +128,18 @@ def __init__( self.nr_validation_snapshots = 0 # Arrays and data sets containing the actual data. - self.training_data_inputs = torch.empty(0) - self.validation_data_inputs = torch.empty(0) - self.test_data_inputs = torch.empty(0) - self.training_data_outputs = torch.empty(0) - self.validation_data_outputs = torch.empty(0) - self.test_data_outputs = torch.empty(0) + self._training_data_inputs = torch.empty(0) + self._validation_data_inputs = torch.empty(0) + self._test_data_inputs = torch.empty(0) + self._training_data_outputs = torch.empty(0) + self._validation_data_outputs = torch.empty(0) + self._test_data_outputs = torch.empty(0) self.training_data_sets = [] self.validation_data_sets = [] self.test_data_sets = [] # Needed for the fast tensor data sets. - self.mini_batch_size = parameters.running.mini_batch_size + self._mini_batch_size = parameters.running.mini_batch_size if clear_data: self.clear_data() @@ -258,7 +293,7 @@ def get_test_input_gradient(self, snapshot_number): Returns ------- - torch.Tensor + gradient : torch.Tensor Tensor holding the gradient. """ @@ -274,7 +309,7 @@ def get_test_input_gradient(self, snapshot_number): ) return self.test_data_sets[0].input_data.grad else: - return self.test_data_inputs.grad[ + return self._test_data_inputs.grad[ snapshot.grid_size * snapshot_number : snapshot.grid_size * (snapshot_number + 1) @@ -315,11 +350,14 @@ def raw_numpy_to_converted_scaled_tensor( ---------- numpy_array : np.array Array that is to be converted. + data_type : string Either "in" or "out", depending if input or output data is + processed. units : string Units of the data that is processed. + convert3Dto1D : bool If True (default: False), then a (x,y,z,dim) array is transformed into a (x*y*z,dim) array. 
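
The attributes documented in this patch (the data scalers, snapshot counts, and torch data sets) are populated through the public DataHandler workflow rather than set directly. A minimal usage sketch, assuming numpy snapshot files on disk; the snapshot file names and paths below are placeholders, not part of this patch:

    import mala

    # Assumed setup: scaling options taken from the documented rescaling types.
    parameters = mala.Parameters()
    parameters.data.input_rescaling_type = "feature-wise-standard"
    parameters.data.output_rescaling_type = "normal"

    data_handler = mala.DataHandler(parameters)
    # Register snapshots; "tr"/"va" select the snapshot function and decide
    # which of the data sets listed above each snapshot ends up in.
    data_handler.add_snapshot("snapshot0.in.npy", "/path/to/data",
                              "snapshot0.out.npy", "/path/to/data", "tr")
    data_handler.add_snapshot("snapshot1.in.npy", "/path/to/data",
                              "snapshot1.out.npy", "/path/to/data", "va")
    # Loads and scales the data, fitting input_data_scaler/output_data_scaler
    # and filling training_data_sets/validation_data_sets.
    data_handler.prepare_data()
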
@@ -479,31 +517,31 @@ def _check_snapshots(self): def __allocate_arrays(self): if self.nr_training_data > 0: - self.training_data_inputs = np.zeros( + self._training_data_inputs = np.zeros( (self.nr_training_data, self.input_dimension), dtype=DEFAULT_NP_DATA_DTYPE, ) - self.training_data_outputs = np.zeros( + self._training_data_outputs = np.zeros( (self.nr_training_data, self.output_dimension), dtype=DEFAULT_NP_DATA_DTYPE, ) if self.nr_validation_data > 0: - self.validation_data_inputs = np.zeros( + self._validation_data_inputs = np.zeros( (self.nr_validation_data, self.input_dimension), dtype=DEFAULT_NP_DATA_DTYPE, ) - self.validation_data_outputs = np.zeros( + self._validation_data_outputs = np.zeros( (self.nr_validation_data, self.output_dimension), dtype=DEFAULT_NP_DATA_DTYPE, ) if self.nr_test_data > 0: - self.test_data_inputs = np.zeros( + self._test_data_inputs = np.zeros( (self.nr_test_data, self.input_dimension), dtype=DEFAULT_NP_DATA_DTYPE, ) - self.test_data_outputs = np.zeros( + self._test_data_outputs = np.zeros( (self.nr_test_data, self.output_dimension), dtype=DEFAULT_NP_DATA_DTYPE, ) @@ -593,34 +631,34 @@ def __load_data(self, function, data_type): # all ears. if data_type == "inputs": if function == "training": - self.training_data_inputs = torch.from_numpy( - self.training_data_inputs + self._training_data_inputs = torch.from_numpy( + self._training_data_inputs ).float() if function == "validation": - self.validation_data_inputs = torch.from_numpy( - self.validation_data_inputs + self._validation_data_inputs = torch.from_numpy( + self._validation_data_inputs ).float() if function == "test": - self.test_data_inputs = torch.from_numpy( - self.test_data_inputs + self._test_data_inputs = torch.from_numpy( + self._test_data_inputs ).float() if data_type == "outputs": if function == "training": - self.training_data_outputs = torch.from_numpy( - self.training_data_outputs + self._training_data_outputs = torch.from_numpy( + self._training_data_outputs ).float() if function == "validation": - self.validation_data_outputs = torch.from_numpy( - self.validation_data_outputs + self._validation_data_outputs = torch.from_numpy( + self._validation_data_outputs ).float() if function == "test": - self.test_data_outputs = torch.from_numpy( - self.test_data_outputs + self._test_data_outputs = torch.from_numpy( + self._test_data_outputs ).float() def __build_datasets(self): @@ -701,7 +739,7 @@ def __build_datasets(self): if snapshot.snapshot_function == "tr": self.training_data_sets.append( LazyLoadDatasetSingle( - self.mini_batch_size, + self._mini_batch_size, snapshot, self.input_dimension, self.output_dimension, @@ -715,7 +753,7 @@ def __build_datasets(self): if snapshot.snapshot_function == "va": self.validation_data_sets.append( LazyLoadDatasetSingle( - self.mini_batch_size, + self._mini_batch_size, snapshot, self.input_dimension, self.output_dimension, @@ -729,7 +767,7 @@ def __build_datasets(self): if snapshot.snapshot_function == "te": self.test_data_sets.append( LazyLoadDatasetSingle( - self.mini_batch_size, + self._mini_batch_size, snapshot, self.input_dimension, self.output_dimension, @@ -744,58 +782,60 @@ def __build_datasets(self): else: if self.nr_training_data != 0: - self.input_data_scaler.transform(self.training_data_inputs) - self.output_data_scaler.transform(self.training_data_outputs) + self.input_data_scaler.transform(self._training_data_inputs) + self.output_data_scaler.transform(self._training_data_outputs) if self.parameters.use_fast_tensor_data_set: printout("Using 
FastTensorDataset.", min_verbosity=2) self.training_data_sets.append( FastTensorDataset( - self.mini_batch_size, - self.training_data_inputs, - self.training_data_outputs, + self._mini_batch_size, + self._training_data_inputs, + self._training_data_outputs, ) ) else: self.training_data_sets.append( TensorDataset( - self.training_data_inputs, - self.training_data_outputs, + self._training_data_inputs, + self._training_data_outputs, ) ) if self.nr_validation_data != 0: self.__load_data("validation", "inputs") - self.input_data_scaler.transform(self.validation_data_inputs) + self.input_data_scaler.transform(self._validation_data_inputs) self.__load_data("validation", "outputs") - self.output_data_scaler.transform(self.validation_data_outputs) + self.output_data_scaler.transform( + self._validation_data_outputs + ) if self.parameters.use_fast_tensor_data_set: printout("Using FastTensorDataset.", min_verbosity=2) self.validation_data_sets.append( FastTensorDataset( - self.mini_batch_size, - self.validation_data_inputs, - self.validation_data_outputs, + self._mini_batch_size, + self._validation_data_inputs, + self._validation_data_outputs, ) ) else: self.validation_data_sets.append( TensorDataset( - self.validation_data_inputs, - self.validation_data_outputs, + self._validation_data_inputs, + self._validation_data_outputs, ) ) if self.nr_test_data != 0: self.__load_data("test", "inputs") - self.input_data_scaler.transform(self.test_data_inputs) - self.test_data_inputs.requires_grad = True + self.input_data_scaler.transform(self._test_data_inputs) + self._test_data_inputs.requires_grad = True self.__load_data("test", "outputs") - self.output_data_scaler.transform(self.test_data_outputs) + self.output_data_scaler.transform(self._test_data_outputs) self.test_data_sets.append( TensorDataset( - self.test_data_inputs, self.test_data_outputs + self._test_data_inputs, self._test_data_outputs ) ) @@ -859,7 +899,7 @@ def __parametrize_scalers(self): else: self.__load_data("training", "inputs") - self.input_data_scaler.fit(self.training_data_inputs) + self.input_data_scaler.fit(self._training_data_inputs) printout("Input scaler parametrized.", min_verbosity=1) @@ -918,7 +958,7 @@ def __parametrize_scalers(self): else: self.__load_data("training", "outputs") - self.output_data_scaler.fit(self.training_data_outputs) + self.output_data_scaler.fit(self._training_data_outputs) printout("Output scaler parametrized.", min_verbosity=1) From dffb463c2016a0c69770098b4d326945df92855d Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 16:09:30 +0100 Subject: [PATCH 06/21] Forgot to change an attribute reference --- mala/datahandling/data_handler.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mala/datahandling/data_handler.py b/mala/datahandling/data_handler.py index 85ec098e3..0b6017361 100644 --- a/mala/datahandling/data_handler.py +++ b/mala/datahandling/data_handler.py @@ -569,7 +569,7 @@ def __load_data(self, function, data_type): raise Exception("Unknown data type detected.") # Extracting all the information pertaining to the data set. 
- array = function + "_data_" + data_type + array = "_" + function + "_data_" + data_type if data_type == "inputs": calculator = self.descriptor_calculator else: From 59b629cd489fb4e2f98e71d38dcd41ab32e377c6 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 16:23:11 +0100 Subject: [PATCH 07/21] Did DataHandlerBase --- mala/datahandling/data_handler.py | 16 ++++++++-------- mala/datahandling/data_handler_base.py | 16 +++++++++++++++- 2 files changed, 23 insertions(+), 9 deletions(-) diff --git a/mala/datahandling/data_handler.py b/mala/datahandling/data_handler.py index 0b6017361..ced970960 100644 --- a/mala/datahandling/data_handler.py +++ b/mala/datahandling/data_handler.py @@ -107,14 +107,14 @@ def __init__( if self.input_data_scaler is None: self.input_data_scaler = DataScaler( self.parameters.input_rescaling_type, - use_ddp=self.use_ddp, + use_ddp=self._use_ddp, ) self.output_data_scaler = output_data_scaler if self.output_data_scaler is None: self.output_data_scaler = DataScaler( self.parameters.output_rescaling_type, - use_ddp=self.use_ddp, + use_ddp=self._use_ddp, ) # Actual data points in the different categories. @@ -677,7 +677,7 @@ def __build_datasets(self): self.output_data_scaler, self.descriptor_calculator, self.target_calculator, - self.use_ddp, + self._use_ddp, self.parameters._configuration["device"], ) ) @@ -689,7 +689,7 @@ def __build_datasets(self): self.output_data_scaler, self.descriptor_calculator, self.target_calculator, - self.use_ddp, + self._use_ddp, self.parameters._configuration["device"], ) ) @@ -703,7 +703,7 @@ def __build_datasets(self): self.output_data_scaler, self.descriptor_calculator, self.target_calculator, - self.use_ddp, + self._use_ddp, self.parameters._configuration["device"], input_requires_grad=True, ) @@ -747,7 +747,7 @@ def __build_datasets(self): self.output_data_scaler, self.descriptor_calculator, self.target_calculator, - self.use_ddp, + self._use_ddp, ) ) if snapshot.snapshot_function == "va": @@ -761,7 +761,7 @@ def __build_datasets(self): self.output_data_scaler, self.descriptor_calculator, self.target_calculator, - self.use_ddp, + self._use_ddp, ) ) if snapshot.snapshot_function == "te": @@ -775,7 +775,7 @@ def __build_datasets(self): self.output_data_scaler, self.descriptor_calculator, self.target_calculator, - self.use_ddp, + self._use_ddp, input_requires_grad=True, ) ) diff --git a/mala/datahandling/data_handler_base.py b/mala/datahandling/data_handler_base.py index 54e27e959..c141551fa 100644 --- a/mala/datahandling/data_handler_base.py +++ b/mala/datahandling/data_handler_base.py @@ -28,6 +28,20 @@ class DataHandlerBase(ABC): target_calculator : mala.targets.target.Target Used to do unit conversion on output data. If None, then one will be created by this class. + + Attributes + ---------- + descriptor_calculator + Used to do unit conversion on input data. + + nr_snapshots : int + Number of snapshots loaded. + + parameters : mala.common.parameters.ParametersData + MALA data handling parameters. + + target_calculator + Used to do unit conversion on output data. """ def __init__( @@ -37,7 +51,7 @@ def __init__( descriptor_calculator=None, ): self.parameters: ParametersData = parameters.data - self.use_ddp = parameters.use_ddp + self._use_ddp = parameters.use_ddp # Calculators used to parse data from compatible files. 
self.target_calculator = target_calculator From 6721a7fdac1f3b3205a25653b0e3963cb5c6e842 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 16:40:02 +0100 Subject: [PATCH 08/21] Did DataScaler, changes will have to be merged with data scaling PR --- mala/datahandling/data_scaler.py | 248 ++++++++++++++++--------------- test/all_lazy_loading_test.py | 32 ++-- 2 files changed, 146 insertions(+), 134 deletions(-) diff --git a/mala/datahandling/data_scaler.py b/mala/datahandling/data_scaler.py index e3c8a5328..3ecf39881 100644 --- a/mala/datahandling/data_scaler.py +++ b/mala/datahandling/data_scaler.py @@ -32,45 +32,50 @@ class DataScaler: use_ddp : bool If True, the DataScaler will use ddp to check that data is only saved on the root process in parallel execution. + + Attributes + ---------- + cantransform : bool + If True, this scaler is set up to perform scaling. """ def __init__(self, typestring, use_ddp=False): - self.use_ddp = use_ddp - self.typestring = typestring - self.scale_standard = False - self.scale_normal = False - self.feature_wise = False + self._use_ddp = use_ddp + self._typestring = typestring + self._scale_standard = False + self._scale_normal = False + self._feature_wise = False self.cantransform = False self.__parse_typestring() - self.means = torch.empty(0) - self.stds = torch.empty(0) - self.maxs = torch.empty(0) - self.mins = torch.empty(0) - self.total_mean = torch.tensor(0) - self.total_std = torch.tensor(0) - self.total_max = torch.tensor(float("-inf")) - self.total_min = torch.tensor(float("inf")) + self._means = torch.empty(0) + self._stds = torch.empty(0) + self._maxs = torch.empty(0) + self._mins = torch.empty(0) + self._total_mean = torch.tensor(0) + self._total_std = torch.tensor(0) + self._total_max = torch.tensor(float("-inf")) + self._total_min = torch.tensor(float("inf")) - self.total_data_count = 0 + self._total_data_count = 0 def __parse_typestring(self): """Parse the typestring to class attributes.""" - self.scale_standard = False - self.scale_normal = False - self.feature_wise = False - - if "standard" in self.typestring: - self.scale_standard = True - if "normal" in self.typestring: - self.scale_normal = True - if "feature-wise" in self.typestring: - self.feature_wise = True - if self.scale_standard is False and self.scale_normal is False: + self._scale_standard = False + self._scale_normal = False + self._feature_wise = False + + if "standard" in self._typestring: + self._scale_standard = True + if "normal" in self._typestring: + self._scale_normal = True + if "feature-wise" in self._typestring: + self._feature_wise = True + if self._scale_standard is False and self._scale_normal is False: printout("No data rescaling will be performed.", min_verbosity=1) self.cantransform = True return - if self.scale_standard is True and self.scale_normal is True: + if self._scale_standard is True and self._scale_normal is True: raise Exception("Invalid input data rescaling.") def start_incremental_fitting(self): @@ -79,7 +84,7 @@ def start_incremental_fitting(self): This is necessary for lazy loading. """ - self.total_data_count = 0 + self._total_data_count = 0 def incremental_fit(self, unscaled): """ @@ -93,71 +98,71 @@ def incremental_fit(self, unscaled): Data that is to be added to the fit. 
""" - if self.scale_standard is False and self.scale_normal is False: + if self._scale_standard is False and self._scale_normal is False: return else: with torch.no_grad(): - if self.feature_wise: + if self._feature_wise: ########################## # Feature-wise-scaling ########################## - if self.scale_standard: + if self._scale_standard: new_mean = torch.mean(unscaled, 0, keepdim=True) new_std = torch.std(unscaled, 0, keepdim=True) current_data_count = list(unscaled.size())[0] - old_mean = self.means - old_std = self.stds + old_mean = self._means + old_std = self._stds - if list(self.means.size())[0] > 0: - self.means = ( - self.total_data_count - / (self.total_data_count + current_data_count) + if list(self._means.size())[0] > 0: + self._means = ( + self._total_data_count + / (self._total_data_count + current_data_count) * old_mean + current_data_count - / (self.total_data_count + current_data_count) + / (self._total_data_count + current_data_count) * new_mean ) else: - self.means = new_mean - if list(self.stds.size())[0] > 0: - self.stds = ( - self.total_data_count - / (self.total_data_count + current_data_count) + self._means = new_mean + if list(self._stds.size())[0] > 0: + self._stds = ( + self._total_data_count + / (self._total_data_count + current_data_count) * old_std**2 + current_data_count - / (self.total_data_count + current_data_count) + / (self._total_data_count + current_data_count) * new_std**2 - + (self.total_data_count * current_data_count) - / (self.total_data_count + current_data_count) + + (self._total_data_count * current_data_count) + / (self._total_data_count + current_data_count) ** 2 * (old_mean - new_mean) ** 2 ) - self.stds = torch.sqrt(self.stds) + self._stds = torch.sqrt(self._stds) else: - self.stds = new_std - self.total_data_count += current_data_count + self._stds = new_std + self._total_data_count += current_data_count - if self.scale_normal: + if self._scale_normal: new_maxs = torch.max(unscaled, 0, keepdim=True) - if list(self.maxs.size())[0] > 0: + if list(self._maxs.size())[0] > 0: for i in range(list(new_maxs.values.size())[1]): - if new_maxs.values[0, i] > self.maxs[i]: - self.maxs[i] = new_maxs.values[0, i] + if new_maxs.values[0, i] > self._maxs[i]: + self._maxs[i] = new_maxs.values[0, i] else: - self.maxs = new_maxs.values[0, :] + self._maxs = new_maxs.values[0, :] new_mins = torch.min(unscaled, 0, keepdim=True) - if list(self.mins.size())[0] > 0: + if list(self._mins.size())[0] > 0: for i in range(list(new_mins.values.size())[1]): - if new_mins.values[0, i] < self.mins[i]: - self.mins[i] = new_mins.values[0, i] + if new_mins.values[0, i] < self._mins[i]: + self._mins[i] = new_mins.values[0, i] else: - self.mins = new_mins.values[0, :] + self._mins = new_mins.values[0, :] else: @@ -165,7 +170,7 @@ def incremental_fit(self, unscaled): # Total scaling ########################## - if self.scale_standard: + if self._scale_standard: current_data_count = ( list(unscaled.size())[0] * list(unscaled.size())[1] ) @@ -173,15 +178,15 @@ def incremental_fit(self, unscaled): new_mean = torch.mean(unscaled) new_std = torch.std(unscaled) - old_mean = self.total_mean - old_std = self.total_std + old_mean = self._total_mean + old_std = self._total_std - self.total_mean = ( - self.total_data_count - / (self.total_data_count + current_data_count) + self._total_mean = ( + self._total_data_count + / (self._total_data_count + current_data_count) * old_mean + current_data_count - / (self.total_data_count + current_data_count) + / (self._total_data_count + 
current_data_count) * new_mean ) @@ -190,29 +195,30 @@ def incremental_fit(self, unscaled): # results. # Maybe we should check it at some point . # I think it is merely an issue of numerical accuracy. - self.total_std = ( - self.total_data_count - / (self.total_data_count + current_data_count) + self._total_std = ( + self._total_data_count + / (self._total_data_count + current_data_count) * old_std**2 + current_data_count - / (self.total_data_count + current_data_count) + / (self._total_data_count + current_data_count) * new_std**2 - + (self.total_data_count * current_data_count) - / (self.total_data_count + current_data_count) ** 2 + + (self._total_data_count * current_data_count) + / (self._total_data_count + current_data_count) + ** 2 * (old_mean - new_mean) ** 2 ) - self.total_std = torch.sqrt(self.total_std) - self.total_data_count += current_data_count + self._total_std = torch.sqrt(self._total_std) + self._total_data_count += current_data_count - if self.scale_normal: + if self._scale_normal: new_max = torch.max(unscaled) - if new_max > self.total_max: - self.total_max = new_max + if new_max > self._total_max: + self._total_max = new_max new_min = torch.min(unscaled) - if new_min < self.total_min: - self.total_min = new_min + if new_min < self._total_min: + self._total_min = new_min def finish_incremental_fitting(self): """ @@ -232,23 +238,27 @@ def fit(self, unscaled): Data that on which the scaling will be calculated. """ - if self.scale_standard is False and self.scale_normal is False: + if self._scale_standard is False and self._scale_normal is False: return else: with torch.no_grad(): - if self.feature_wise: + if self._feature_wise: ########################## # Feature-wise-scaling ########################## - if self.scale_standard: - self.means = torch.mean(unscaled, 0, keepdim=True) - self.stds = torch.std(unscaled, 0, keepdim=True) + if self._scale_standard: + self._means = torch.mean(unscaled, 0, keepdim=True) + self._stds = torch.std(unscaled, 0, keepdim=True) - if self.scale_normal: - self.maxs = torch.max(unscaled, 0, keepdim=True).values - self.mins = torch.min(unscaled, 0, keepdim=True).values + if self._scale_normal: + self._maxs = torch.max( + unscaled, 0, keepdim=True + ).values + self._mins = torch.min( + unscaled, 0, keepdim=True + ).values else: @@ -256,13 +266,13 @@ def fit(self, unscaled): # Total scaling ########################## - if self.scale_standard: - self.total_mean = torch.mean(unscaled) - self.total_std = torch.std(unscaled) + if self._scale_standard: + self._total_mean = torch.mean(unscaled) + self._total_std = torch.std(unscaled) - if self.scale_normal: - self.total_max = torch.max(unscaled) - self.total_min = torch.min(unscaled) + if self._scale_normal: + self._total_max = torch.max(unscaled) + self._total_min = torch.min(unscaled) self.cantransform = True @@ -284,7 +294,7 @@ def transform(self, unscaled): Scaled data. """ # First we need to find out if we even have to do anything. - if self.scale_standard is False and self.scale_normal is False: + if self._scale_standard is False and self._scale_normal is False: pass elif self.cantransform is False: @@ -296,19 +306,19 @@ def transform(self, unscaled): # Perform the actual scaling, but use no_grad to make sure # that the next couple of iterations stay untracked. 
with torch.no_grad(): - if self.feature_wise: + if self._feature_wise: ########################## # Feature-wise-scaling ########################## - if self.scale_standard: - unscaled -= self.means - unscaled /= self.stds + if self._scale_standard: + unscaled -= self._means + unscaled /= self._stds - if self.scale_normal: - unscaled -= self.mins - unscaled /= self.maxs - self.mins + if self._scale_normal: + unscaled -= self._mins + unscaled /= self._maxs - self._mins else: @@ -316,13 +326,13 @@ def transform(self, unscaled): # Total scaling ########################## - if self.scale_standard: - unscaled -= self.total_mean - unscaled /= self.total_std + if self._scale_standard: + unscaled -= self._total_mean + unscaled /= self._total_std - if self.scale_normal: - unscaled -= self.total_min - unscaled /= self.total_max - self.total_min + if self._scale_normal: + unscaled -= self._total_min + unscaled /= self._total_max - self._total_min def inverse_transform(self, scaled, as_numpy=False): """ @@ -346,7 +356,7 @@ def inverse_transform(self, scaled, as_numpy=False): """ # First we need to find out if we even have to do anything. - if self.scale_standard is False and self.scale_normal is False: + if self._scale_standard is False and self._scale_normal is False: unscaled = scaled else: @@ -359,19 +369,19 @@ def inverse_transform(self, scaled, as_numpy=False): # Perform the actual scaling, but use no_grad to make sure # that the next couple of iterations stay untracked. with torch.no_grad(): - if self.feature_wise: + if self._feature_wise: ########################## # Feature-wise-scaling ########################## - if self.scale_standard: - unscaled = (scaled * self.stds) + self.means + if self._scale_standard: + unscaled = (scaled * self._stds) + self._means - if self.scale_normal: + if self._scale_normal: unscaled = ( - scaled * (self.maxs - self.mins) - ) + self.mins + scaled * (self._maxs - self._mins) + ) + self._mins else: @@ -379,13 +389,15 @@ def inverse_transform(self, scaled, as_numpy=False): # Total scaling ########################## - if self.scale_standard: - unscaled = (scaled * self.total_std) + self.total_mean + if self._scale_standard: + unscaled = ( + scaled * self._total_std + ) + self._total_mean - if self.scale_normal: + if self._scale_normal: unscaled = ( - scaled * (self.total_max - self.total_min) - ) + self.total_min + scaled * (self._total_max - self._total_min) + ) + self._total_min # if as_numpy: return unscaled.detach().numpy().astype(np.float64) @@ -405,7 +417,7 @@ def save(self, filename, save_format="pickle"): File format which will be used for saving. """ # If we use ddp, only save the network on root. - if self.use_ddp: + if self._use_ddp: if dist.get_rank() != 0: return if save_format == "pickle": diff --git a/test/all_lazy_loading_test.py b/test/all_lazy_loading_test.py index 5130266a7..4e7661bff 100644 --- a/test/all_lazy_loading_test.py +++ b/test/all_lazy_loading_test.py @@ -110,34 +110,34 @@ def test_scaling(self): # I presume to be due to numerical constraints. To make a # meaningful comparison it is wise to scale the value here. 
this_result.append( - data_handler.input_data_scaler.total_mean + data_handler.input_data_scaler._total_mean / data_handler.nr_training_data ) this_result.append( - data_handler.input_data_scaler.total_std + data_handler.input_data_scaler._total_std / data_handler.nr_training_data ) this_result.append( - data_handler.output_data_scaler.total_mean + data_handler.output_data_scaler._total_mean / data_handler.nr_training_data ) this_result.append( - data_handler.output_data_scaler.total_std + data_handler.output_data_scaler._total_std / data_handler.nr_training_data ) elif scalingtype == "normal": torch.manual_seed(2002) this_result.append( - data_handler.input_data_scaler.total_max + data_handler.input_data_scaler._total_max ) this_result.append( - data_handler.input_data_scaler.total_min + data_handler.input_data_scaler._total_min ) this_result.append( - data_handler.output_data_scaler.total_max + data_handler.output_data_scaler._total_max ) this_result.append( - data_handler.output_data_scaler.total_min + data_handler.output_data_scaler._total_min ) dataset_tester.append( (data_handler.training_data_sets[0][3998])[0].sum() @@ -165,41 +165,41 @@ def test_scaling(self): # I presume to be due to numerical constraints. To make a # meaningful comparison it is wise to scale the value here. this_result.append( - torch.mean(data_handler.input_data_scaler.means) + torch.mean(data_handler.input_data_scaler._means) / data_handler.parameters.snapshot_directories_list[ 0 ].grid_size ) this_result.append( - torch.mean(data_handler.input_data_scaler.stds) + torch.mean(data_handler.input_data_scaler._stds) / data_handler.parameters.snapshot_directories_list[ 0 ].grid_size ) this_result.append( - torch.mean(data_handler.output_data_scaler.means) + torch.mean(data_handler.output_data_scaler._means) / data_handler.parameters.snapshot_directories_list[ 0 ].grid_size ) this_result.append( - torch.mean(data_handler.output_data_scaler.stds) + torch.mean(data_handler.output_data_scaler._stds) / data_handler.parameters.snapshot_directories_list[ 0 ].grid_size ) elif scalingtype == "feature-wise-normal": this_result.append( - torch.mean(data_handler.input_data_scaler.maxs) + torch.mean(data_handler.input_data_scaler._maxs) ) this_result.append( - torch.mean(data_handler.input_data_scaler.mins) + torch.mean(data_handler.input_data_scaler._mins) ) this_result.append( - torch.mean(data_handler.output_data_scaler.maxs) + torch.mean(data_handler.output_data_scaler._maxs) ) this_result.append( - torch.mean(data_handler.output_data_scaler.mins) + torch.mean(data_handler.output_data_scaler._mins) ) comparison.append(this_result) From c84b314cd24f16c71f315efc9d4e838c768950d7 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 17:00:02 +0100 Subject: [PATCH 09/21] Some more data handling classes done --- mala/datahandling/data_shuffler.py | 16 ++-- mala/datahandling/fast_tensor_dataset.py | 28 ++++-- mala/datahandling/lazy_load_dataset.py | 116 ++++++++++++----------- 3 files changed, 91 insertions(+), 69 deletions(-) diff --git a/mala/datahandling/data_shuffler.py b/mala/datahandling/data_shuffler.py index c3f71644f..9303b0ee7 100644 --- a/mala/datahandling/data_shuffler.py +++ b/mala/datahandling/data_shuffler.py @@ -53,7 +53,7 @@ def __init__( self.descriptor_calculator.parameters.descriptors_contain_xyz = ( False ) - self.data_points_to_remove = None + self._data_points_to_remove = None def add_snapshot( self, @@ -135,8 +135,8 @@ def __shuffle_numpy( # then we have to trim the original snapshots to size # 
the indicies to be removed are selected at random if ( - self.data_points_to_remove is not None - and np.sum(self.data_points_to_remove) > 0 + self._data_points_to_remove is not None + and np.sum(self._data_points_to_remove) > 0 ): if self.parameters.shuffling_seed is not None: np.random.seed(idx * self.parameters.shuffling_seed) @@ -155,7 +155,7 @@ def __shuffle_numpy( indices = np.random.choice( ngrid, - size=ngrid - self.data_points_to_remove[idx], + size=ngrid - self._data_points_to_remove[idx], ) descriptor_data[idx] = current_descriptor[indices] @@ -548,7 +548,7 @@ def shuffle_snapshots( ] ) number_of_data_points = np.sum(snapshot_size_list) - self.data_points_to_remove = None + self._data_points_to_remove = None if number_of_shuffled_snapshots is None: number_of_shuffled_snapshots = self.nr_snapshots @@ -584,13 +584,13 @@ def shuffle_snapshots( np.sum(shuffled_gridsizes) * number_of_shuffled_snapshots ) - self.data_points_to_remove = [] + self._data_points_to_remove = [] for i in range(0, self.nr_snapshots): - self.data_points_to_remove.append( + self._data_points_to_remove.append( snapshot_size_list[i] - shuffled_gridsizes[i] * number_of_shuffled_snapshots ) - tot_points_missing = sum(self.data_points_to_remove) + tot_points_missing = sum(self._data_points_to_remove) if tot_points_missing > 0: printout( diff --git a/mala/datahandling/fast_tensor_dataset.py b/mala/datahandling/fast_tensor_dataset.py index 6b38477d5..0f650b56a 100644 --- a/mala/datahandling/fast_tensor_dataset.py +++ b/mala/datahandling/fast_tensor_dataset.py @@ -10,15 +10,29 @@ class FastTensorDataset(torch.utils.data.Dataset): This version of TensorDataset gathers data using a single call within __getitem__. A bit more tricky to manage but is faster still. + + Parameters + ---------- + batch_size : int + Batch size to be used with this data set. + + tensors : object + Torch tensors for this data set. + + Attributes + ---------- + batch_size : int + Batch size to be used with this data set. """ def __init__(self, batch_size, *tensors): + """ """ super(FastTensorDataset).__init__() self.batch_size = batch_size - self.tensors = tensors + self._tensors = tensors total_samples = tensors[0].shape[0] - self.indices = np.arange(total_samples) - self.len = total_samples // self.batch_size + self._indices = np.arange(total_samples) + self._len = total_samples // self.batch_size def __getitem__(self, idx): """ @@ -36,16 +50,16 @@ def __getitem__(self, idx): batch : tuple The data tuple for this batch. """ - batch = self.indices[ + batch = self._indices[ idx * self.batch_size : (idx + 1) * self.batch_size ] - rv = tuple(t[batch, ...] for t in self.tensors) + rv = tuple(t[batch, ...] for t in self._tensors) return rv def __len__(self): """Get the length of the data set.""" - return self.len + return self._len def shuffle(self): """Shuffle the data set.""" - np.random.shuffle(self.indices) + np.random.shuffle(self._indices) diff --git a/mala/datahandling/lazy_load_dataset.py b/mala/datahandling/lazy_load_dataset.py index 00810beb3..a5a2b1a50 100644 --- a/mala/datahandling/lazy_load_dataset.py +++ b/mala/datahandling/lazy_load_dataset.py @@ -48,6 +48,17 @@ class LazyLoadDataset(Dataset): input_requires_grad : bool If True, then the gradient is stored for the inputs. + + Attributes + ---------- + currently_loaded_file : int + Index of currently loaded file. + + input_data : torch.Tensor + Input data tensor. + + output_data : torch.Tensor + Output data tensor. 
""" def __init__( @@ -62,25 +73,22 @@ def __init__( device, input_requires_grad=False, ): - self.snapshot_list = [] - self.input_dimension = input_dimension - self.output_dimension = output_dimension - self.input_data_scaler = input_data_scaler - self.output_data_scaler = output_data_scaler - self.descriptor_calculator = descriptor_calculator - self.target_calculator = target_calculator - self.number_of_snapshots = 0 - self.total_size = 0 - self.descriptors_contain_xyz = ( - self.descriptor_calculator.descriptors_contain_xyz - ) + self._snapshot_list = [] + self._input_dimension = input_dimension + self._output_dimension = output_dimension + self._input_data_scaler = input_data_scaler + self._output_data_scaler = output_data_scaler + self._descriptor_calculator = descriptor_calculator + self._target_calculator = target_calculator + self._number_of_snapshots = 0 + self._total_size = 0 self.currently_loaded_file = None self.input_data = np.empty(0) self.output_data = np.empty(0) - self.use_ddp = use_ddp + self._use_ddp = use_ddp self.return_outputs_directly = False - self.input_requires_grad = input_requires_grad - self.device = device + self._input_requires_grad = input_requires_grad + self._device = device @property def return_outputs_directly(self): @@ -108,9 +116,9 @@ def add_snapshot_to_dataset(self, snapshot: Snapshot): Snapshot that is to be added to this DataSet. """ - self.snapshot_list.append(snapshot) - self.number_of_snapshots += 1 - self.total_size += snapshot.grid_size + self._snapshot_list.append(snapshot) + self._number_of_snapshots += 1 + self._total_size += snapshot.grid_size def mix_datasets(self): """ @@ -118,16 +126,16 @@ def mix_datasets(self): With this, there can be some variance between runs. """ - used_perm = torch.randperm(self.number_of_snapshots) + used_perm = torch.randperm(self._number_of_snapshots) barrier() - if self.use_ddp: - used_perm = used_perm.to(device=self.device) + if self._use_ddp: + used_perm = used_perm.to(device=self._device) dist.broadcast(used_perm, 0) - self.snapshot_list = [ - self.snapshot_list[i] for i in used_perm.to("cpu") + self._snapshot_list = [ + self._snapshot_list[i] for i in used_perm.to("cpu") ] else: - self.snapshot_list = [self.snapshot_list[i] for i in used_perm] + self._snapshot_list = [self._snapshot_list[i] for i in used_perm] self.get_new_data(0) def get_new_data(self, file_index): @@ -140,50 +148,50 @@ def get_new_data(self, file_index): File to be read. """ # Load the data into RAM. 
- if self.snapshot_list[file_index].snapshot_type == "numpy": - self.input_data = self.descriptor_calculator.read_from_numpy_file( + if self._snapshot_list[file_index].snapshot_type == "numpy": + self.input_data = self._descriptor_calculator.read_from_numpy_file( os.path.join( - self.snapshot_list[file_index].input_npy_directory, - self.snapshot_list[file_index].input_npy_file, + self._snapshot_list[file_index].input_npy_directory, + self._snapshot_list[file_index].input_npy_file, ), - units=self.snapshot_list[file_index].input_units, + units=self._snapshot_list[file_index].input_units, ) - self.output_data = self.target_calculator.read_from_numpy_file( + self.output_data = self._target_calculator.read_from_numpy_file( os.path.join( - self.snapshot_list[file_index].output_npy_directory, - self.snapshot_list[file_index].output_npy_file, + self._snapshot_list[file_index].output_npy_directory, + self._snapshot_list[file_index].output_npy_file, ), - units=self.snapshot_list[file_index].output_units, + units=self._snapshot_list[file_index].output_units, ) - elif self.snapshot_list[file_index].snapshot_type == "openpmd": + elif self._snapshot_list[file_index].snapshot_type == "openpmd": self.input_data = ( - self.descriptor_calculator.read_from_openpmd_file( + self._descriptor_calculator.read_from_openpmd_file( os.path.join( - self.snapshot_list[file_index].input_npy_directory, - self.snapshot_list[file_index].input_npy_file, + self._snapshot_list[file_index].input_npy_directory, + self._snapshot_list[file_index].input_npy_file, ) ) ) - self.output_data = self.target_calculator.read_from_openpmd_file( + self.output_data = self._target_calculator.read_from_openpmd_file( os.path.join( - self.snapshot_list[file_index].output_npy_directory, - self.snapshot_list[file_index].output_npy_file, + self._snapshot_list[file_index].output_npy_directory, + self._snapshot_list[file_index].output_npy_file, ) ) # Transform the data. self.input_data = self.input_data.reshape( - [self.snapshot_list[file_index].grid_size, self.input_dimension] + [self._snapshot_list[file_index].grid_size, self._input_dimension] ) if self.input_data.dtype != DEFAULT_NP_DATA_DTYPE: self.input_data = self.input_data.astype(DEFAULT_NP_DATA_DTYPE) self.input_data = torch.from_numpy(self.input_data).float() - self.input_data_scaler.transform(self.input_data) - self.input_data.requires_grad = self.input_requires_grad + self._input_data_scaler.transform(self.input_data) + self.input_data.requires_grad = self._input_requires_grad self.output_data = self.output_data.reshape( - [self.snapshot_list[file_index].grid_size, self.output_dimension] + [self._snapshot_list[file_index].grid_size, self._output_dimension] ) if self.return_outputs_directly is False: self.output_data = np.array(self.output_data) @@ -192,7 +200,7 @@ def get_new_data(self, file_index): DEFAULT_NP_DATA_DTYPE ) self.output_data = torch.from_numpy(self.output_data).float() - self.output_data_scaler.transform(self.output_data) + self._output_data_scaler.transform(self.output_data) # Save which data we have currently loaded. self.currently_loaded_file = file_index @@ -201,28 +209,28 @@ def _get_file_index(self, idx, is_slice=False, is_start=False): file_index = None index_in_file = idx if is_slice: - for i in range(len(self.snapshot_list)): - if index_in_file - self.snapshot_list[i].grid_size <= 0: + for i in range(len(self._snapshot_list)): + if index_in_file - self._snapshot_list[i].grid_size <= 0: file_index = i # From the end of previous file to beginning of new. 
if ( - index_in_file == self.snapshot_list[i].grid_size + index_in_file == self._snapshot_list[i].grid_size and is_start ): file_index = i + 1 index_in_file = 0 break else: - index_in_file -= self.snapshot_list[i].grid_size + index_in_file -= self._snapshot_list[i].grid_size return file_index, index_in_file else: - for i in range(len(self.snapshot_list)): - if index_in_file - self.snapshot_list[i].grid_size < 0: + for i in range(len(self._snapshot_list)): + if index_in_file - self._snapshot_list[i].grid_size < 0: file_index = i break else: - index_in_file -= self.snapshot_list[i].grid_size + index_in_file -= self._snapshot_list[i].grid_size return file_index, index_in_file def __getitem__(self, idx): @@ -266,7 +274,7 @@ def __getitem__(self, idx): # the stop index will point to the wrong file. if file_index_start != file_index_stop: if index_in_file_stop == 0: - index_in_file_stop = self.snapshot_list[ + index_in_file_stop = self._snapshot_list[ file_index_stop ].grid_size else: @@ -297,4 +305,4 @@ def __len__(self): length : int Number of data points in DataSet. """ - return self.total_size + return self._total_size From 259d3ed16be10af209adcac86bcd95c9c0678514 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 17:28:08 +0100 Subject: [PATCH 10/21] Finished with data handling --- mala/datahandling/lazy_load_dataset_single.py | 97 ++++++++++++++----- mala/datahandling/ldos_aligner.py | 33 +++---- .../multi_lazy_load_data_loader.py | 42 ++++---- mala/datahandling/snapshot.py | 54 ++++++++++- mala/network/objective_base.py | 3 +- mala/network/runner.py | 2 +- 6 files changed, 164 insertions(+), 67 deletions(-) diff --git a/mala/datahandling/lazy_load_dataset_single.py b/mala/datahandling/lazy_load_dataset_single.py index 33d7fee87..402d149de 100644 --- a/mala/datahandling/lazy_load_dataset_single.py +++ b/mala/datahandling/lazy_load_dataset_single.py @@ -44,6 +44,56 @@ class LazyLoadDatasetSingle(Dataset): input_requires_grad : bool If True, then the gradient is stored for the inputs. + + Attributes + ---------- + allocated : bool + True if dataset is allocated. + + currently_loaded_file : int + Index of currently loaded file + + descriptor_calculator : mala.descriptors.descriptor.Descriptor + Used to do unit conversion on input data. + + input_data : torch.Tensor + Input data tensor. + + input_dtype : numpy.dtype + Input data type. + + input_shape : list + Input data dimensions + + input_shm_name : str + Name of shared memory allocated for input data + + loaded : bool + True if data has been loaded to shared memory. + + output_data : torch.Tensor + Output data tensor. + + output_dtype : numpy.dtype + Output data dtype. + + output_shape : list + Output data dimensions. + + output_shm_name : str + Name of shared memory allocated for output data. + + return_outputs_directly : bool + + Control whether outputs are actually transformed. + Has to be False for training. In the testing case, + Numerical errors are smaller if set to True. + + snapshot : mala.datahandling.snapshot.Snapshot + Currently loaded snapshot object. + + target_calculator : mala.targets.target.Target or derivative + Used to do unit conversion on output data. 
""" def __init__( @@ -60,27 +110,24 @@ def __init__( input_requires_grad=False, ): self.snapshot = snapshot - self.input_dimension = input_dimension - self.output_dimension = output_dimension - self.input_data_scaler = input_data_scaler - self.output_data_scaler = output_data_scaler + self._input_dimension = input_dimension + self._output_dimension = output_dimension + self._input_data_scaler = input_data_scaler + self._output_data_scaler = output_data_scaler self.descriptor_calculator = descriptor_calculator self.target_calculator = target_calculator - self.number_of_snapshots = 0 - self.total_size = 0 - self.descriptors_contain_xyz = ( - self.descriptor_calculator.descriptors_contain_xyz - ) + self._number_of_snapshots = 0 + self._total_size = 0 self.currently_loaded_file = None self.input_data = np.empty(0) self.output_data = np.empty(0) - self.use_ddp = use_ddp + self._use_ddp = use_ddp self.return_outputs_directly = False - self.input_requires_grad = input_requires_grad + self._input_requires_grad = input_requires_grad - self.batch_size = batch_size - self.len = int(np.ceil(snapshot.grid_size / self.batch_size)) - self.indices = np.arange(snapshot.grid_size) + self._batch_size = batch_size + self._len = int(np.ceil(snapshot.grid_size / self._batch_size)) + self._indices = np.arange(snapshot.grid_size) self.input_shm_name = None self.output_shm_name = None self.loaded = False @@ -197,20 +244,20 @@ def __getitem__(self, idx): output_shm = shared_memory.SharedMemory(name=self.output_shm_name) input_data = np.ndarray( - shape=[self.snapshot.grid_size, self.input_dimension], + shape=[self.snapshot.grid_size, self._input_dimension], dtype=np.float32, buffer=input_shm.buf, ) output_data = np.ndarray( - shape=[self.snapshot.grid_size, self.output_dimension], + shape=[self.snapshot.grid_size, self._output_dimension], dtype=np.float32, buffer=output_shm.buf, ) - if idx == self.len - 1: - batch = self.indices[idx * self.batch_size :] + if idx == self._len - 1: + batch = self._indices[idx * self._batch_size :] else: - batch = self.indices[ - idx * self.batch_size : (idx + 1) * self.batch_size + batch = self._indices[ + idx * self._batch_size : (idx + 1) * self._batch_size ] # print(batch.shape) @@ -219,12 +266,12 @@ def __getitem__(self, idx): # Perform conversion to tensor and perform transforms input_batch = torch.from_numpy(input_batch) - self.input_data_scaler.transform(input_batch) - input_batch.requires_grad = self.input_requires_grad + self._input_data_scaler.transform(input_batch) + input_batch.requires_grad = self._input_requires_grad if self.return_outputs_directly is False: output_batch = torch.from_numpy(output_batch) - self.output_data_scaler.transform(output_batch) + self._output_data_scaler.transform(output_batch) input_shm.close() output_shm.close() @@ -240,7 +287,7 @@ def __len__(self): length : int Number of data points in DataSet. """ - return self.len + return self._len def mix_datasets(self): """ @@ -257,4 +304,4 @@ def mix_datasets(self): avoid erroneously overwriting shared memory data in cases where a single dataset object is used back to back. """ - np.random.shuffle(self.indices) + np.random.shuffle(self._indices) diff --git a/mala/datahandling/ldos_aligner.py b/mala/datahandling/ldos_aligner.py index 892a94fbf..acc712094 100644 --- a/mala/datahandling/ldos_aligner.py +++ b/mala/datahandling/ldos_aligner.py @@ -33,6 +33,11 @@ class LDOSAligner(DataHandlerBase): target_calculator : mala.targets.target.Target Used to do unit conversion on output data. 
If None, then one will be created by this class. + + Attributes + ---------- + ldos_parameters : mala.common.parameters.ParametersTargets + MALA target calculation parameters. """ def __init__( @@ -85,8 +90,6 @@ def add_snapshot( def align_ldos_to_ref( self, - save_path=None, - save_name=None, save_path_ext="aligned/", reference_index=0, zero_tol=1e-5, @@ -96,35 +99,34 @@ def align_ldos_to_ref( n_shift_mse=None, ): """ - Add a snapshot to the data pipeline. + Align LDOS to reference. Parameters ---------- - save_path : string - path to save the aligned LDOS vectors - save_name : string - naming convention for the aligned LDOS vectors save_path_ext : string - additional path for the LDOS vectors (useful if - save_path is left as default None) + Extra path to be added to the input path before saving. + By default, new snapshot files are saved into exactly the + same directory they were read from with exactly the same name. + reference_index : int the snapshot number (in the snapshot directory list) to which all other LDOS vectors are aligned + zero_tol : float the "zero" value for alignment / left side truncation always scaled by norm of reference LDOS mean + left_truncate : bool whether to truncate the zero values on the LHS + right_truncate_value : float right-hand energy value (based on reference LDOS vector) to which truncate LDOS vectors if None, no right-side truncation - egrid_spacing_ev : float - spacing of energy grid - egrid_offset_ev : float - original offset of energy grid + number_of_electrons : float / int if not None, computes the energy shift relative to QE energies + n_shift_mse : int how many energy grid points to consider when aligning LDOS vectors based on mean-squared error @@ -304,10 +306,9 @@ def align_ldos_to_ref( json.dump(ldos_shift_info, f, indent=2) barrier() - + @staticmethod def calc_optimal_ldos_shift( - e_grid, ldos_mean, ldos_mean_ref, left_index, @@ -322,8 +323,6 @@ def calc_optimal_ldos_shift( Parameters ---------- - e_grid : array_like - energy grid ldos_mean : array_like mean of LDOS vector for shifting ldos_mean_ref : array_like diff --git a/mala/datahandling/multi_lazy_load_data_loader.py b/mala/datahandling/multi_lazy_load_data_loader.py index ed0154e32..a9aca6afc 100644 --- a/mala/datahandling/multi_lazy_load_data_loader.py +++ b/mala/datahandling/multi_lazy_load_data_loader.py @@ -20,23 +20,23 @@ class MultiLazyLoadDataLoader: """ def __init__(self, datasets, **kwargs): - self.datasets = datasets - self.loaders = [] + self._datasets = datasets + self._loaders = [] for d in datasets: - self.loaders.append( + self._loaders.append( DataLoader(d, batch_size=None, **kwargs, shuffle=False) ) # Create single process pool for prefetching # Can use ThreadPoolExecutor for debugging. # self.pool = concurrent.futures.ThreadPoolExecutor(1) - self.pool = concurrent.futures.ProcessPoolExecutor(1) + self._pool = concurrent.futures.ProcessPoolExecutor(1) # Allocate shared memory and commence file load for first # dataset in list - dset = self.datasets[0] + dset = self._datasets[0] dset.allocate_shared_mem() - self.load_future = self.pool.submit( + self._load_future = self._pool.submit( self.load_snapshot_to_shm, dset.snapshot, dset.descriptor_calculator, @@ -54,7 +54,7 @@ def __len__(self): length : int Number of datasets/snapshots contained within this loader. """ - return len(self.loaders) + return len(self._loaders) def __iter__(self): """ @@ -66,7 +66,7 @@ def __iter__(self): An iterator over the individual datasets/snapshots in this object. 
""" - self.count = 0 + self._count = 0 return self def __next__(self): @@ -78,25 +78,25 @@ def __next__(self): iterator: DataLoader The next data loader. """ - self.count += 1 - if self.count > len(self.loaders): + self._count += 1 + if self._count > len(self._loaders): raise StopIteration else: # Wait on last prefetch - if self.count - 1 >= 0: - if not self.datasets[self.count - 1].loaded: - self.load_future.result() - self.datasets[self.count - 1].loaded = True + if self._count - 1 >= 0: + if not self._datasets[self._count - 1].loaded: + self._load_future.result() + self._datasets[self._count - 1].loaded = True # Delete last - if self.count - 2 >= 0: - self.datasets[self.count - 2].delete_data() + if self._count - 2 >= 0: + self._datasets[self._count - 2].delete_data() # Prefetch next file (looping around epoch boundary) - dset = self.datasets[self.count % len(self.loaders)] + dset = self._datasets[self._count % len(self._loaders)] if not dset.loaded: dset.allocate_shared_mem() - self.load_future = self.pool.submit( + self._load_future = self._pool.submit( self.load_snapshot_to_shm, dset.snapshot, dset.descriptor_calculator, @@ -106,7 +106,7 @@ def __next__(self): ) # Return current - return self.loaders[self.count - 1] + return self._loaders[self._count - 1] # TODO: Without this function, I get 2 times the number of snapshots # memory leaks after shutdown. With it, I get 1 times the number of @@ -114,9 +114,9 @@ def __next__(self): # enough? I am not sure where the memory leak is coming from. def cleanup(self): """Deallocate arrays still left in memory.""" - for dset in self.datasets: + for dset in self._datasets: dset.deallocate_shared_mem() - self.pool.shutdown() + self._pool.shutdown() # Worker function to load data into shared memory (limited to numpy files # only for now) diff --git a/mala/datahandling/snapshot.py b/mala/datahandling/snapshot.py index 8f6bc4666..0385da478 100644 --- a/mala/datahandling/snapshot.py +++ b/mala/datahandling/snapshot.py @@ -43,8 +43,58 @@ class Snapshot(JSONSerializable): - tr: This snapshot will be a training snapshot. - va: This snapshot will be a validation snapshot. - Replaces the old approach of MALA to have a separate list. - Default is None. + Attributes + ---------- + calculation_output : string + File with the output of the original snapshot calculation. This is + only needed when testing multiple snapshots. + + grid_dimensions : list + Grid dimension [x,y,z]. + + grid_size : int + Number of grid points in total. + + input_dimension : int + Input feature dimension. + + output_dimension : int + Output feature dimension + + input_npy_file : string + File with saved numpy input array. + + input_npy_directory : string + Directory containing input_npy_directory. + + output_npy_file : string + File with saved numpy output array. + + output_npy_directory : string + Directory containing output_npy_file. + + input_units : string + Units of input data. See descriptor classes to see which units are + supported. + + output_units : string + Units of output data. See target classes to see which units are + supported. + + calculation_output : string + File with the output of the original snapshot calculation. This is + only needed when testing multiple snapshots. + + snapshot_function : string + "Function" of the snapshot in the MALA workflow. + + - te: This snapshot will be a testing snapshot. + - tr: This snapshot will be a training snapshot. + - va: This snapshot will be a validation snapshot. 
+ + snapshot_type : string + Can be either "numpy" or "openpmd" and denotes which type of files + this snapshot contains. """ def __init__( diff --git a/mala/network/objective_base.py b/mala/network/objective_base.py index 2fbf29503..c90916935 100644 --- a/mala/network/objective_base.py +++ b/mala/network/objective_base.py @@ -7,6 +7,7 @@ from mala.network.hyperparameter_oat import HyperparameterOAT from mala.network.network import Network from mala.network.trainer import Trainer +from mala.common.parameters import Parameters from mala import printout @@ -29,7 +30,7 @@ def __init__(self, params, data_handler): data_handler : mala.datahandling.data_handler.DataHandler datahandler to be used during the hyperparameter optimization. """ - self.params = params + self.params: Parameters = params self.data_handler = data_handler # We need to find out if we have to reparametrize the lists with the diff --git a/mala/network/runner.py b/mala/network/runner.py index 7d3d2ffa8..9daf32f6a 100644 --- a/mala/network/runner.py +++ b/mala/network/runner.py @@ -46,7 +46,7 @@ def __init__(self, params, network, data, runner_dict=None): self.parameters_full: Parameters = params self.parameters: ParametersRunning = params.running self.network = network - self.data = data + self.data: DataHandler = data self.__prepare_to_run() def _calculate_errors( From 8557bb2bd1afc5a2b438952f7a5812505c6e0573 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Fri, 22 Nov 2024 18:31:30 +0100 Subject: [PATCH 11/21] Finished with descriptors --- .../advanced/ex10_convert_numpy_openpmd.py | 8 +- mala/datahandling/data_scaler.py | 285 ++++++++++-------- mala/descriptors/atomic_density.py | 22 +- mala/descriptors/bispectrum.py | 64 ++-- mala/descriptors/descriptor.py | 140 +++++---- mala/descriptors/minterpy_descriptors.py | 24 +- mala/network/predictor.py | 2 +- test/all_lazy_loading_test.py | 32 +- test/complete_interfaces_test.py | 14 +- 9 files changed, 316 insertions(+), 275 deletions(-) diff --git a/examples/advanced/ex10_convert_numpy_openpmd.py b/examples/advanced/ex10_convert_numpy_openpmd.py index 45369ff89..7ebc22daa 100644 --- a/examples/advanced/ex10_convert_numpy_openpmd.py +++ b/examples/advanced/ex10_convert_numpy_openpmd.py @@ -29,7 +29,7 @@ descriptor_save_path="./", target_save_path="./", additional_info_save_path="./", - naming_scheme="converted_from_numpy_*.bp5", + naming_scheme="converted_from_numpy_*.h5", descriptor_calculation_kwargs={"working_directory": "./"}, ) @@ -40,11 +40,9 @@ for snapshot in range(2): data_converter.add_snapshot( descriptor_input_type="openpmd", - descriptor_input_path="converted_from_numpy_{}.in.bp5".format( - snapshot - ), + descriptor_input_path="converted_from_numpy_{}.in.h5".format(snapshot), target_input_type="openpmd", - target_input_path="converted_from_numpy_{}.out.bp5".format(snapshot), + target_input_path="converted_from_numpy_{}.out.h5".format(snapshot), additional_info_input_type=None, additional_info_input_path=None, target_units=None, diff --git a/mala/datahandling/data_scaler.py b/mala/datahandling/data_scaler.py index 3ecf39881..ffabcf56e 100644 --- a/mala/datahandling/data_scaler.py +++ b/mala/datahandling/data_scaler.py @@ -37,45 +37,87 @@ class DataScaler: ---------- cantransform : bool If True, this scaler is set up to perform scaling. 
+ + feature_wise : bool + (Managed internally, not set to private due to legacy issues) + + maxs : torch.Tensor + (Managed internally, not set to private due to legacy issues) + + means : torch.Tensor + (Managed internally, not set to private due to legacy issues) + + mins : torch.Tensor + (Managed internally, not set to private due to legacy issues) + + scale_normal : bool + (Managed internally, not set to private due to legacy issues) + + scale_standard : bool + (Managed internally, not set to private due to legacy issues) + + stds : torch.Tensor + (Managed internally, not set to private due to legacy issues) + + total_data_count : int + (Managed internally, not set to private due to legacy issues) + + total_max : float + (Managed internally, not set to private due to legacy issues) + + total_mean : float + (Managed internally, not set to private due to legacy issues) + + total_min : float + (Managed internally, not set to private due to legacy issues) + + total_std : float + (Managed internally, not set to private due to legacy issues) + + typestring : str + (Managed internally, not set to private due to legacy issues) + + use_ddp : bool + (Managed internally, not set to private due to legacy issues) """ def __init__(self, typestring, use_ddp=False): - self._use_ddp = use_ddp - self._typestring = typestring - self._scale_standard = False - self._scale_normal = False - self._feature_wise = False + self.use_ddp = use_ddp + self.typestring = typestring + self.scale_standard = False + self.scale_normal = False + self.feature_wise = False self.cantransform = False self.__parse_typestring() - self._means = torch.empty(0) - self._stds = torch.empty(0) - self._maxs = torch.empty(0) - self._mins = torch.empty(0) - self._total_mean = torch.tensor(0) - self._total_std = torch.tensor(0) - self._total_max = torch.tensor(float("-inf")) - self._total_min = torch.tensor(float("inf")) + self.means = torch.empty(0) + self.stds = torch.empty(0) + self.maxs = torch.empty(0) + self.mins = torch.empty(0) + self.total_mean = torch.tensor(0) + self.total_std = torch.tensor(0) + self.total_max = torch.tensor(float("-inf")) + self.total_min = torch.tensor(float("inf")) - self._total_data_count = 0 + self.total_data_count = 0 def __parse_typestring(self): """Parse the typestring to class attributes.""" - self._scale_standard = False - self._scale_normal = False - self._feature_wise = False - - if "standard" in self._typestring: - self._scale_standard = True - if "normal" in self._typestring: - self._scale_normal = True - if "feature-wise" in self._typestring: - self._feature_wise = True - if self._scale_standard is False and self._scale_normal is False: + self.scale_standard = False + self.scale_normal = False + self.feature_wise = False + + if "standard" in self.typestring: + self.scale_standard = True + if "normal" in self.typestring: + self.scale_normal = True + if "feature-wise" in self.typestring: + self.feature_wise = True + if self.scale_standard is False and self.scale_normal is False: printout("No data rescaling will be performed.", min_verbosity=1) self.cantransform = True return - if self._scale_standard is True and self._scale_normal is True: + if self.scale_standard is True and self.scale_normal is True: raise Exception("Invalid input data rescaling.") def start_incremental_fitting(self): @@ -84,7 +126,7 @@ def start_incremental_fitting(self): This is necessary for lazy loading. 
""" - self._total_data_count = 0 + self.total_data_count = 0 def incremental_fit(self, unscaled): """ @@ -98,71 +140,71 @@ def incremental_fit(self, unscaled): Data that is to be added to the fit. """ - if self._scale_standard is False and self._scale_normal is False: + if self.scale_standard is False and self.scale_normal is False: return else: with torch.no_grad(): - if self._feature_wise: + if self.feature_wise: ########################## # Feature-wise-scaling ########################## - if self._scale_standard: + if self.scale_standard: new_mean = torch.mean(unscaled, 0, keepdim=True) new_std = torch.std(unscaled, 0, keepdim=True) current_data_count = list(unscaled.size())[0] - old_mean = self._means - old_std = self._stds + old_mean = self.means + old_std = self.stds - if list(self._means.size())[0] > 0: - self._means = ( - self._total_data_count - / (self._total_data_count + current_data_count) + if list(self.means.size())[0] > 0: + self.means = ( + self.total_data_count + / (self.total_data_count + current_data_count) * old_mean + current_data_count - / (self._total_data_count + current_data_count) + / (self.total_data_count + current_data_count) * new_mean ) else: - self._means = new_mean - if list(self._stds.size())[0] > 0: - self._stds = ( - self._total_data_count - / (self._total_data_count + current_data_count) + self.means = new_mean + if list(self.stds.size())[0] > 0: + self.stds = ( + self.total_data_count + / (self.total_data_count + current_data_count) * old_std**2 + current_data_count - / (self._total_data_count + current_data_count) + / (self.total_data_count + current_data_count) * new_std**2 - + (self._total_data_count * current_data_count) - / (self._total_data_count + current_data_count) + + (self.total_data_count * current_data_count) + / (self.total_data_count + current_data_count) ** 2 * (old_mean - new_mean) ** 2 ) - self._stds = torch.sqrt(self._stds) + self.stds = torch.sqrt(self.stds) else: - self._stds = new_std - self._total_data_count += current_data_count + self.stds = new_std + self.total_data_count += current_data_count - if self._scale_normal: + if self.scale_normal: new_maxs = torch.max(unscaled, 0, keepdim=True) - if list(self._maxs.size())[0] > 0: + if list(self.maxs.size())[0] > 0: for i in range(list(new_maxs.values.size())[1]): - if new_maxs.values[0, i] > self._maxs[i]: - self._maxs[i] = new_maxs.values[0, i] + if new_maxs.values[0, i] > self.maxs[i]: + self.maxs[i] = new_maxs.values[0, i] else: - self._maxs = new_maxs.values[0, :] + self.maxs = new_maxs.values[0, :] new_mins = torch.min(unscaled, 0, keepdim=True) - if list(self._mins.size())[0] > 0: + if list(self.mins.size())[0] > 0: for i in range(list(new_mins.values.size())[1]): - if new_mins.values[0, i] < self._mins[i]: - self._mins[i] = new_mins.values[0, i] + if new_mins.values[0, i] < self.mins[i]: + self.mins[i] = new_mins.values[0, i] else: - self._mins = new_mins.values[0, :] + self.mins = new_mins.values[0, :] else: @@ -170,7 +212,7 @@ def incremental_fit(self, unscaled): # Total scaling ########################## - if self._scale_standard: + if self.scale_standard: current_data_count = ( list(unscaled.size())[0] * list(unscaled.size())[1] ) @@ -178,15 +220,15 @@ def incremental_fit(self, unscaled): new_mean = torch.mean(unscaled) new_std = torch.std(unscaled) - old_mean = self._total_mean - old_std = self._total_std + old_mean = self.total_mean + old_std = self.total_std - self._total_mean = ( - self._total_data_count - / (self._total_data_count + current_data_count) + 
self.total_mean = ( + self.total_data_count + / (self.total_data_count + current_data_count) * old_mean + current_data_count - / (self._total_data_count + current_data_count) + / (self.total_data_count + current_data_count) * new_mean ) @@ -195,30 +237,29 @@ def incremental_fit(self, unscaled): # results. # Maybe we should check it at some point . # I think it is merely an issue of numerical accuracy. - self._total_std = ( - self._total_data_count - / (self._total_data_count + current_data_count) + self.total_std = ( + self.total_data_count + / (self.total_data_count + current_data_count) * old_std**2 + current_data_count - / (self._total_data_count + current_data_count) + / (self.total_data_count + current_data_count) * new_std**2 - + (self._total_data_count * current_data_count) - / (self._total_data_count + current_data_count) - ** 2 + + (self.total_data_count * current_data_count) + / (self.total_data_count + current_data_count) ** 2 * (old_mean - new_mean) ** 2 ) - self._total_std = torch.sqrt(self._total_std) - self._total_data_count += current_data_count + self.total_std = torch.sqrt(self.total_std) + self.total_data_count += current_data_count - if self._scale_normal: + if self.scale_normal: new_max = torch.max(unscaled) - if new_max > self._total_max: - self._total_max = new_max + if new_max > self.total_max: + self.total_max = new_max new_min = torch.min(unscaled) - if new_min < self._total_min: - self._total_min = new_min + if new_min < self.total_min: + self.total_min = new_min def finish_incremental_fitting(self): """ @@ -238,27 +279,23 @@ def fit(self, unscaled): Data that on which the scaling will be calculated. """ - if self._scale_standard is False and self._scale_normal is False: + if self.scale_standard is False and self.scale_normal is False: return else: with torch.no_grad(): - if self._feature_wise: + if self.feature_wise: ########################## # Feature-wise-scaling ########################## - if self._scale_standard: - self._means = torch.mean(unscaled, 0, keepdim=True) - self._stds = torch.std(unscaled, 0, keepdim=True) + if self.scale_standard: + self.means = torch.mean(unscaled, 0, keepdim=True) + self.stds = torch.std(unscaled, 0, keepdim=True) - if self._scale_normal: - self._maxs = torch.max( - unscaled, 0, keepdim=True - ).values - self._mins = torch.min( - unscaled, 0, keepdim=True - ).values + if self.scale_normal: + self.maxs = torch.max(unscaled, 0, keepdim=True).values + self.mins = torch.min(unscaled, 0, keepdim=True).values else: @@ -266,13 +303,13 @@ def fit(self, unscaled): # Total scaling ########################## - if self._scale_standard: - self._total_mean = torch.mean(unscaled) - self._total_std = torch.std(unscaled) + if self.scale_standard: + self.total_mean = torch.mean(unscaled) + self.total_std = torch.std(unscaled) - if self._scale_normal: - self._total_max = torch.max(unscaled) - self._total_min = torch.min(unscaled) + if self.scale_normal: + self.total_max = torch.max(unscaled) + self.total_min = torch.min(unscaled) self.cantransform = True @@ -294,7 +331,7 @@ def transform(self, unscaled): Scaled data. """ # First we need to find out if we even have to do anything. - if self._scale_standard is False and self._scale_normal is False: + if self.scale_standard is False and self.scale_normal is False: pass elif self.cantransform is False: @@ -306,19 +343,19 @@ def transform(self, unscaled): # Perform the actual scaling, but use no_grad to make sure # that the next couple of iterations stay untracked. 
with torch.no_grad(): - if self._feature_wise: + if self.feature_wise: ########################## # Feature-wise-scaling ########################## - if self._scale_standard: - unscaled -= self._means - unscaled /= self._stds + if self.scale_standard: + unscaled -= self.means + unscaled /= self.stds - if self._scale_normal: - unscaled -= self._mins - unscaled /= self._maxs - self._mins + if self.scale_normal: + unscaled -= self.mins + unscaled /= self.maxs - self.mins else: @@ -326,13 +363,13 @@ def transform(self, unscaled): # Total scaling ########################## - if self._scale_standard: - unscaled -= self._total_mean - unscaled /= self._total_std + if self.scale_standard: + unscaled -= self.total_mean + unscaled /= self.total_std - if self._scale_normal: - unscaled -= self._total_min - unscaled /= self._total_max - self._total_min + if self.scale_normal: + unscaled -= self.total_min + unscaled /= self.total_max - self.total_min def inverse_transform(self, scaled, as_numpy=False): """ @@ -356,7 +393,7 @@ def inverse_transform(self, scaled, as_numpy=False): """ # First we need to find out if we even have to do anything. - if self._scale_standard is False and self._scale_normal is False: + if self.scale_standard is False and self.scale_normal is False: unscaled = scaled else: @@ -369,19 +406,19 @@ def inverse_transform(self, scaled, as_numpy=False): # Perform the actual scaling, but use no_grad to make sure # that the next couple of iterations stay untracked. with torch.no_grad(): - if self._feature_wise: + if self.feature_wise: ########################## # Feature-wise-scaling ########################## - if self._scale_standard: - unscaled = (scaled * self._stds) + self._means + if self.scale_standard: + unscaled = (scaled * self.stds) + self.means - if self._scale_normal: + if self.scale_normal: unscaled = ( - scaled * (self._maxs - self._mins) - ) + self._mins + scaled * (self.maxs - self.mins) + ) + self.mins else: @@ -389,15 +426,13 @@ def inverse_transform(self, scaled, as_numpy=False): # Total scaling ########################## - if self._scale_standard: - unscaled = ( - scaled * self._total_std - ) + self._total_mean + if self.scale_standard: + unscaled = (scaled * self.total_std) + self.total_mean - if self._scale_normal: + if self.scale_normal: unscaled = ( - scaled * (self._total_max - self._total_min) - ) + self._total_min + scaled * (self.total_max - self.total_min) + ) + self.total_min # if as_numpy: return unscaled.detach().numpy().astype(np.float64) @@ -417,7 +452,7 @@ def save(self, filename, save_format="pickle"): File format which will be used for saving. """ # If we use ddp, only save the network on root. - if self._use_ddp: + if self.use_ddp: if dist.get_rank() != 0: return if save_format == "pickle": diff --git a/mala/descriptors/atomic_density.py b/mala/descriptors/atomic_density.py index 6c5a7acac..4459c838b 100755 --- a/mala/descriptors/atomic_density.py +++ b/mala/descriptors/atomic_density.py @@ -31,18 +31,12 @@ class AtomicDensity(Descriptor): def __init__(self, parameters): super(AtomicDensity, self).__init__(parameters) - self.verbosity = parameters.verbosity @property def data_name(self): """Get a string that describes the target (for e.g. 
metadata).""" return "AtomicDensity" - @property - def feature_size(self): - """Get the feature dimension of this data.""" - return self.fingerprint_length - @staticmethod def convert_units(array, in_units="None"): """ @@ -140,7 +134,7 @@ def __calculate_lammps(self, outdir, **kwargs): self.setup_lammps_tmp_files("ggrid", outdir) ase.io.write( - self.lammps_temporary_input, self.atoms, format=lammps_format + self._lammps_temporary_input, self._atoms, format=lammps_format ) nx = self.grid_dimensions[0] @@ -151,7 +145,7 @@ def __calculate_lammps(self, outdir, **kwargs): if self.parameters.atomic_density_sigma is None: self.grid_dimensions = [nx, ny, nz] self.parameters.atomic_density_sigma = self.get_optimal_sigma( - self.voxel + self._voxel ) # Create LAMMPS instance. @@ -213,7 +207,7 @@ def __calculate_lammps(self, outdir, **kwargs): if return_directly: return gaussian_descriptors_np else: - self.fingerprint_length = 4 + self.feature_size = 4 return gaussian_descriptors_np, nrows_ggrid else: # Since the atomic density may be directly fed back into QE @@ -238,10 +232,10 @@ def __calculate_lammps(self, outdir, **kwargs): [2, 1, 0, 3] ) if self.parameters.descriptors_contain_xyz: - self.fingerprint_length = 4 + self.feature_size = 4 return gaussian_descriptors_np[:, :, :, 3:], nx * ny * nz else: - self.fingerprint_length = 1 + self.feature_size = 1 return gaussian_descriptors_np[:, :, :, 6:], nx * ny * nz def __calculate_python(self, **kwargs): @@ -281,7 +275,7 @@ def __calculate_python(self, **kwargs): # This follows the implementation in the LAMMPS code. if self.parameters.atomic_density_sigma is None: self.parameters.atomic_density_sigma = self.get_optimal_sigma( - self.voxel + self._voxel ) cutoff_squared = ( self.parameters.atomic_density_cutoff @@ -329,10 +323,10 @@ def __calculate_python(self, **kwargs): ) if self.parameters.descriptors_contain_xyz: - self.fingerprint_length = 4 + self.feature_size = 4 return gaussian_descriptors_np, np.prod(self.grid_dimensions) else: - self.fingerprint_length = 1 + self.feature_size = 1 return gaussian_descriptors_np[:, :, :, 3:], np.prod( self.grid_dimensions ) diff --git a/mala/descriptors/bispectrum.py b/mala/descriptors/bispectrum.py index 207fac341..ab8bbff7f 100755 --- a/mala/descriptors/bispectrum.py +++ b/mala/descriptors/bispectrum.py @@ -57,11 +57,6 @@ def data_name(self): """Get a string that describes the target (for e.g. metadata).""" return "Bispectrum" - @property - def feature_size(self): - """Get the feature dimension of this data.""" - return self.fingerprint_length - @staticmethod def convert_units(array, in_units="None"): """ @@ -144,7 +139,7 @@ def __calculate_lammps(self, outdir, **kwargs): self.setup_lammps_tmp_files("bgrid", outdir) ase.io.write( - self.lammps_temporary_input, self.atoms, format=lammps_format + self._lammps_temporary_input, self._atoms, format=lammps_format ) nx = self.grid_dimensions[0] @@ -190,7 +185,7 @@ def __calculate_lammps(self, outdir, **kwargs): * (self.parameters.bispectrum_twojmax + 4) ) ncoeff = ncoeff // 24 # integer division - self.fingerprint_length = ncols0 + ncoeff + self.feature_size = ncols0 + ncoeff # Extract data from LAMMPS calculation. # This is different for the parallel and the serial case. 
@@ -210,7 +205,7 @@ def __calculate_lammps(self, outdir, **kwargs): lammps_constants.LMP_STYLE_LOCAL, lammps_constants.LMP_SIZE_COLS, ) - if ncols_local != self.fingerprint_length + 3: + if ncols_local != self.feature_size + 3: raise Exception("Inconsistent number of features.") snap_descriptors_np = extract_compute_np( @@ -235,7 +230,7 @@ def __calculate_lammps(self, outdir, **kwargs): "bgrid", 0, 2, - (nz, ny, nx, self.fingerprint_length), + (nz, ny, nx, self.feature_size), use_fp64=use_fp64, ) @@ -297,13 +292,13 @@ def __calculate_python(self, **kwargs): * (self.parameters.bispectrum_twojmax + 4) ) ncoeff = ncoeff // 24 # integer division - self.fingerprint_length = ncoeff + 3 + self.feature_size = ncoeff + 3 bispectrum_np = np.zeros( ( self.grid_dimensions[0], self.grid_dimensions[1], self.grid_dimensions[2], - self.fingerprint_length, + self.feature_size, ), dtype=np.float64, ) @@ -313,16 +308,16 @@ def __calculate_python(self, **kwargs): # These are technically hyperparameters. We currently simply set them # to set values for everything. - self.rmin0 = 0.0 - self.rfac0 = 0.99363 - self.bzero_flag = False - self.wselfall_flag = False + self._rmin0 = 0.0 + self._rfac0 = 0.99363 + self._bzero_flag = False + self._wselfall_flag = False # Currently not supported - self.bnorm_flag = False + self._bnorm_flag = False # Currently not supported - self.quadraticflag = False - self.number_elements = 1 - self.wself = 1.0 + self._quadraticflag = False + self._python_calculation_number_elements = 1 + self._wself = 1.0 # What follows is the python implementation of the # bispectrum descriptor calculation. @@ -496,7 +491,7 @@ def __calculate_python(self, **kwargs): if self.parameters.descriptors_contain_xyz: return bispectrum_np, np.prod(self.grid_dimensions) else: - self.fingerprint_length -= 3 + self.feature_size -= 3 return bispectrum_np[:, :, :, 3:], np.prod(self.grid_dimensions) ######## @@ -902,10 +897,10 @@ def __compute_ui(self, nr_atoms, atoms_cutoff, distances_cutoff, grid): """ # Precompute and prepare ui stuff theta0 = ( - (distances_cutoff - self.rmin0) - * self.rfac0 + (distances_cutoff - self._rmin0) + * self._rfac0 * np.pi - / (self.parameters.bispectrum_cutoff - self.rmin0) + / (self.parameters.bispectrum_cutoff - self._rmin0) ) z0 = np.squeeze(distances_cutoff / np.tan(theta0)) @@ -986,13 +981,14 @@ def __compute_ui(self, nr_atoms, atoms_cutoff, distances_cutoff, grid): sfac += 1.0 else: rcutfac = np.pi / ( - self.parameters.bispectrum_cutoff - self.rmin0 + self.parameters.bispectrum_cutoff - self._rmin0 ) if nr_atoms > 1: sfac = 0.5 * ( - np.cos((distances_cutoff - self.rmin0) * rcutfac) + 1.0 + np.cos((distances_cutoff - self._rmin0) * rcutfac) + + 1.0 ) - sfac[np.where(distances_cutoff <= self.rmin0)] = 1.0 + sfac[np.where(distances_cutoff <= self._rmin0)] = 1.0 sfac[ np.where( distances_cutoff @@ -1000,8 +996,8 @@ def __compute_ui(self, nr_atoms, atoms_cutoff, distances_cutoff, grid): ) ] = 0.0 else: - sfac = 1.0 if distances_cutoff <= self.rmin0 else sfac - sfac = 0.0 if distances_cutoff <= self.rmin0 else sfac + sfac = 1.0 if distances_cutoff <= self._rmin0 else sfac + sfac = 0.0 if distances_cutoff <= self._rmin0 else sfac # sfac technically has to be weighted according to the chemical # species. 
But this is a minimal implementation only for a single @@ -1099,12 +1095,12 @@ def __compute_bi(self, ulisttot_r, ulisttot_i, zlist_r, zlist_i): itriple = 0 idouble = 0 - if self.bzero_flag: + if self._bzero_flag: wself = 1.0 bzero = np.zeros(self.parameters.bispectrum_twojmax + 1) www = wself * wself * wself for j in range(self.parameters.bispectrum_twojmax + 1): - if self.bnorm_flag: + if self._bnorm_flag: bzero[j] = www else: bzero[j] = www * (j + 1) @@ -1158,8 +1154,8 @@ def __compute_bi(self, ulisttot_r, ulisttot_i, zlist_r, zlist_i): itriple += 1 idouble += 1 - if self.bzero_flag: - if not self.wselfall_flag: + if self._bzero_flag: + if not self._wselfall_flag: itriple = ( ielem * number_elements + ielem ) * number_elements + ielem @@ -1179,9 +1175,9 @@ def __compute_bi(self, ulisttot_r, ulisttot_i, zlist_r, zlist_i): itriple += 1 # Untested & Unoptimized - if self.quadraticflag: + if self._quadraticflag: xyz_length = 3 if self.parameters.descriptors_contain_xyz else 0 - ncount = self.fingerprint_length - xyz_length + ncount = self.feature_size - xyz_length for icoeff in range(ncount): bveci = blist[icoeff] blist[3 + ncount] = 0.5 * bveci * bveci diff --git a/mala/descriptors/descriptor.py b/mala/descriptors/descriptor.py index 17cd9e5b0..041dd4b3f 100644 --- a/mala/descriptors/descriptor.py +++ b/mala/descriptors/descriptor.py @@ -36,6 +36,10 @@ class Descriptor(PhysicalData): parameters : mala.common.parameters.Parameters Parameters object used to create this object. + Attributes + ---------- + parameters: mala.common.parameters.ParametersDescriptors + MALA descriptor calculation parameters. """ ############################## @@ -106,17 +110,16 @@ def __getnewargs__(self): def __init__(self, parameters): super(Descriptor, self).__init__(parameters) self.parameters: ParametersDescriptors = parameters.descriptors - self.fingerprint_length = 0 # so iterations will fail - self.verbosity = parameters.verbosity - self.in_format_ase = "" - self.atoms = None - self.voxel = None + self.feature_size = 0 # so iterations will fail + self._in_format_ase = "" + self._atoms = None + self._voxel = None # If we ever have NON LAMMPS descriptors, these parameters have no # meaning anymore and should probably be moved to an intermediate # DescriptorsLAMMPS class, from which the LAMMPS descriptors inherit. - self.lammps_temporary_input = None - self.lammps_temporary_log = None + self._lammps_temporary_input = None + self._lammps_temporary_log = None ############################## # Properties @@ -182,6 +185,15 @@ def convert_units(array, in_units="1/eV"): " descriptor type." 
) + @property + def feature_size(self): + """Get the feature dimension of this data.""" + return self._feature_size + + @feature_size.setter + def feature_size(self, value): + self._feature_size = value + @staticmethod def backconvert_units(array, out_units): """ @@ -227,24 +239,24 @@ def setup_lammps_tmp_files(self, lammps_type, outdir): lammps_tmp_input_file = tempfile.NamedTemporaryFile( delete=False, prefix=prefix_inp_str, suffix="_.tmp", dir=outdir ) - self.lammps_temporary_input = lammps_tmp_input_file.name + self._lammps_temporary_input = lammps_tmp_input_file.name lammps_tmp_input_file.close() lammps_tmp_log_file = tempfile.NamedTemporaryFile( delete=False, prefix=prefix_log_str, suffix="_.tmp", dir=outdir ) - self.lammps_temporary_log = lammps_tmp_log_file.name + self._lammps_temporary_log = lammps_tmp_log_file.name lammps_tmp_log_file.close() else: - self.lammps_temporary_input = None - self.lammps_temporary_log = None + self._lammps_temporary_input = None + self._lammps_temporary_log = None if self.parameters._configuration["mpi"]: - self.lammps_temporary_input = get_comm().bcast( - self.lammps_temporary_input, root=0 + self._lammps_temporary_input = get_comm().bcast( + self._lammps_temporary_input, root=0 ) - self.lammps_temporary_log = get_comm().bcast( - self.lammps_temporary_log, root=0 + self._lammps_temporary_log = get_comm().bcast( + self._lammps_temporary_log, root=0 ) # Calculations @@ -328,13 +340,13 @@ def calculate_from_qe_out( (x,y,z,descriptor_dimension) """ - self.in_format_ase = "espresso-out" + self._in_format_ase = "espresso-out" printout("Calculating descriptors from", qe_out_file, min_verbosity=0) # We get the atomic information by using ASE. - self.atoms = ase.io.read(qe_out_file, format=self.in_format_ase) + self._atoms = ase.io.read(qe_out_file, format=self._in_format_ase) # Enforcing / Checking PBC on the read atoms. - self.atoms = self.enforce_pbc(self.atoms) + self._atoms = self.enforce_pbc(self._atoms) # Get the grid dimensions. if "grid_dimensions" in kwargs.keys(): @@ -356,10 +368,10 @@ def calculate_from_qe_out( self.grid_dimensions[2] = int(tmp.split(",")[2]) break - self.voxel = self.atoms.cell.copy() - self.voxel[0] = self.voxel[0] / (self.grid_dimensions[0]) - self.voxel[1] = self.voxel[1] / (self.grid_dimensions[1]) - self.voxel[2] = self.voxel[2] / (self.grid_dimensions[2]) + self._voxel = self._atoms.cell.copy() + self._voxel[0] = self._voxel[0] / (self.grid_dimensions[0]) + self._voxel[1] = self._voxel[1] / (self.grid_dimensions[1]) + self._voxel[2] = self._voxel[2] / (self.grid_dimensions[2]) return self._calculate(working_directory, **kwargs) @@ -400,12 +412,12 @@ def calculate_from_atoms( (x,y,z,descriptor_dimension) """ # Enforcing / Checking PBC on the input atoms. 
- self.atoms = self.enforce_pbc(atoms) + self._atoms = self.enforce_pbc(atoms) self.grid_dimensions = grid_dimensions - self.voxel = self.atoms.cell.copy() - self.voxel[0] = self.voxel[0] / (self.grid_dimensions[0]) - self.voxel[1] = self.voxel[1] / (self.grid_dimensions[1]) - self.voxel[2] = self.voxel[2] / (self.grid_dimensions[2]) + self._voxel = self._atoms.cell.copy() + self._voxel[0] = self._voxel[0] / (self.grid_dimensions[0]) + self._voxel[1] = self._voxel[1] / (self.grid_dimensions[1]) + self._voxel[2] = self._voxel[2] / (self.grid_dimensions[2]) return self._calculate(working_directory, **kwargs) def gather_descriptors(self, descriptors_np, use_pickled_comm=False): @@ -445,7 +457,7 @@ def gather_descriptors(self, descriptors_np, use_pickled_comm=False): sendcounts = np.array( comm.gather(np.shape(descriptors_np)[0], root=0) ) - raw_feature_length = self.fingerprint_length + 3 + raw_feature_length = self.feature_size + 3 if get_rank() == 0: # print("sendcounts: {}, total: {}".format(sendcounts, @@ -490,7 +502,7 @@ def gather_descriptors(self, descriptors_np, use_pickled_comm=False): nx = self.grid_dimensions[0] ny = self.grid_dimensions[1] nz = self.grid_dimensions[2] - descriptors_full = np.zeros([nx, ny, nz, self.fingerprint_length]) + descriptors_full = np.zeros([nx, ny, nz, self.feature_size]) # Fill the full bispectrum descriptors array. for idx, local_grid in enumerate(all_descriptors_list): # We glue the individual cells back together, and transpose. @@ -508,7 +520,7 @@ def gather_descriptors(self, descriptors_np, use_pickled_comm=False): last_z - first_z, last_y - first_y, last_x - first_x, - self.fingerprint_length, + self.feature_size, ], ).transpose( [2, 1, 0, 3] @@ -554,10 +566,10 @@ def convert_local_to_3d(self, descriptors_np): ny = local_reach[1] - local_offset[1] nz = local_reach[2] - local_offset[2] - descriptors_full = np.zeros([nx, ny, nz, self.fingerprint_length]) + descriptors_full = np.zeros([nx, ny, nz, self.feature_size]) descriptors_full[0:nx, 0:ny, 0:nz] = np.reshape( - descriptors_np[:, 3:], [nz, ny, nx, self.fingerprint_length] + descriptors_np[:, 3:], [nz, ny, nx, self.feature_size] ).transpose([2, 1, 0, 3]) return descriptors_full, local_offset, local_reach @@ -580,20 +592,20 @@ def _process_loaded_dimensions(self, array_dimensions): def _set_geometry_info(self, mesh): # Geometry: Save the cell parameters and angles of the grid. 
- if self.atoms is not None: + if self._atoms is not None: import openpmd_api as io - self.voxel = self.atoms.cell.copy() - self.voxel[0] = self.voxel[0] / (self.grid_dimensions[0]) - self.voxel[1] = self.voxel[1] / (self.grid_dimensions[1]) - self.voxel[2] = self.voxel[2] / (self.grid_dimensions[2]) + self._voxel = self._atoms.cell.copy() + self._voxel[0] = self._voxel[0] / (self.grid_dimensions[0]) + self._voxel[1] = self._voxel[1] / (self.grid_dimensions[1]) + self._voxel[2] = self._voxel[2] / (self.grid_dimensions[2]) mesh.geometry = io.Geometry.cartesian - mesh.grid_spacing = self.voxel.cellpar()[0:3] - mesh.set_attribute("angles", self.voxel.cellpar()[3:]) + mesh.grid_spacing = self._voxel.cellpar()[0:3] + mesh.set_attribute("angles", self._voxel.cellpar()[3:]) def _get_atoms(self): - return self.atoms + return self._atoms def _feature_mask(self): if self.descriptors_contain_xyz: @@ -614,9 +626,9 @@ def _setup_lammps(self, nx, ny, nz, lammps_dict): "-screen", "none", "-log", - self.lammps_temporary_log, + self._lammps_temporary_log, ] - lammps_dict["atom_config_fname"] = self.lammps_temporary_input + lammps_dict["atom_config_fname"] = self._lammps_temporary_input if self.parameters._configuration["mpi"]: size = get_size() @@ -833,8 +845,8 @@ def _clean_calculation(self, lmp, keep_logs): lmp.close() if not keep_logs: if get_rank() == 0: - os.remove(self.lammps_temporary_log) - os.remove(self.lammps_temporary_input) + os.remove(self._lammps_temporary_log) + os.remove(self._lammps_temporary_input) def _setup_atom_list(self): """ @@ -847,7 +859,7 @@ def _setup_atom_list(self): FURTHER OPTIMIZATION: Probably not that much, this mostly already uses optimized python functions. """ - if np.any(self.atoms.pbc): + if np.any(self._atoms.pbc): # To determine the list of relevant atoms we first take the edges # of the simulation cell and use them to determine all cells @@ -874,19 +886,19 @@ def _setup_atom_list(self): for edge in edges: edge_point = self._grid_to_coord(edge) neighborlist = NeighborList( - np.zeros(len(self.atoms) + 1) + np.zeros(len(self._atoms) + 1) + [self.parameters.atomic_density_cutoff], bothways=True, self_interaction=False, primitive=NewPrimitiveNeighborList, ) - atoms_with_grid_point = self.atoms.copy() + atoms_with_grid_point = self._atoms.copy() # Construct a ghost atom representing the grid point. atoms_with_grid_point.append(ase.Atom("H", edge_point)) neighborlist.update(atoms_with_grid_point) - indices, offsets = neighborlist.get_neighbors(len(self.atoms)) + indices, offsets = neighborlist.get_neighbors(len(self._atoms)) # Incrementally fill the list containing all cells to be # considered. @@ -911,18 +923,18 @@ def _setup_atom_list(self): # First, instantiate it by filling it will all atoms from all # potentiall relevant cells, as identified above. all_atoms = None - for a in range(0, len(self.atoms)): + for a in range(0, len(self._atoms)): if all_atoms is None: all_atoms = ( - self.atoms.positions[a] - + all_cells @ self.atoms.get_cell() + self._atoms.positions[a] + + all_cells @ self._atoms.get_cell() ) else: all_atoms = np.concatenate( ( all_atoms, - self.atoms.positions[a] - + all_cells @ self.atoms.get_cell(), + self._atoms.positions[a] + + all_cells @ self._atoms.get_cell(), ) ) @@ -975,11 +987,11 @@ def _setup_atom_list(self): :, ] ) - return np.concatenate((all_atoms, self.atoms.positions)) + return np.concatenate((all_atoms, self._atoms.positions)) else: # If no PBC are used, only consider a single cell. 
- return self.atoms.positions + return self._atoms.positions def _grid_to_coord(self, gridpoint): # Convert grid indices to real space grid point. @@ -989,20 +1001,20 @@ def _grid_to_coord(self, gridpoint): # Orthorhombic cells and triclinic ones have # to be treated differently, see domain.cpp - if self.atoms.cell.orthorhombic: - return np.diag(self.voxel) * [i, j, k] + if self._atoms.cell.orthorhombic: + return np.diag(self._voxel) * [i, j, k] else: ret = [0, 0, 0] ret[0] = ( - i / self.grid_dimensions[0] * self.atoms.cell[0, 0] - + j / self.grid_dimensions[1] * self.atoms.cell[1, 0] - + k / self.grid_dimensions[2] * self.atoms.cell[2, 0] + i / self.grid_dimensions[0] * self._atoms.cell[0, 0] + + j / self.grid_dimensions[1] * self._atoms.cell[1, 0] + + k / self.grid_dimensions[2] * self._atoms.cell[2, 0] ) ret[1] = ( - j / self.grid_dimensions[1] * self.atoms.cell[1, 1] - + k / self.grid_dimensions[2] * self.atoms.cell[1, 2] + j / self.grid_dimensions[1] * self._atoms.cell[1, 1] + + k / self.grid_dimensions[2] * self._atoms.cell[1, 2] ) - ret[2] = k / self.grid_dimensions[2] * self.atoms.cell[2, 2] + ret[2] = k / self.grid_dimensions[2] * self._atoms.cell[2, 2] return np.array(ret) @abstractmethod @@ -1010,4 +1022,4 @@ def _calculate(self, outdir, **kwargs): pass def _set_feature_size_from_array(self, array): - self.fingerprint_length = np.shape(array)[-1] + self.feature_size = np.shape(array)[-1] diff --git a/mala/descriptors/minterpy_descriptors.py b/mala/descriptors/minterpy_descriptors.py index 55fd69de4..2d9d52168 100755 --- a/mala/descriptors/minterpy_descriptors.py +++ b/mala/descriptors/minterpy_descriptors.py @@ -1,4 +1,4 @@ -"""Gaussian descriptor class.""" +"""Minterpy descriptor class.""" import os @@ -10,10 +10,14 @@ from mala.descriptors.lammps_utils import extract_compute_np from mala.descriptors.descriptor import Descriptor from mala.descriptors.atomic_density import AtomicDensity +from mala.common.parallelizer import parallel_warn class MinterpyDescriptors(Descriptor): - """Class for calculation and parsing of Gaussian descriptors. + """ + Class for calculation and parsing of Minterpy descriptors. + + Marked for deprecation. Parameters ---------- @@ -23,18 +27,16 @@ class MinterpyDescriptors(Descriptor): def __init__(self, parameters): super(MinterpyDescriptors, self).__init__(parameters) - self.verbosity = parameters.verbosity + parallel_warn( + "Minterpy descriptors will be deprecated starting with MALA v1.4.0", + category=FutureWarning, + ) @property def data_name(self): """Get a string that describes the target (for e.g. metadata).""" return "Minterpy" - @property - def feature_size(self): - """Get the feature dimension of this data.""" - return self.fingerprint_length - @staticmethod def convert_units(array, in_units="None"): """ @@ -149,11 +151,11 @@ def _calculate(self, atoms, outdir, grid_dimensions, **kwargs): ], dtype=np.float64, ) - self.fingerprint_length = ( + self.feature_size = ( len(self.parameters.minterpy_point_list) + coord_length ) - self.fingerprint_length = len(self.parameters.minterpy_point_list) + self.feature_size = len(self.parameters.minterpy_point_list) # Perform one LAMMPS call for each point in the Minterpy point list. 
for idx, point in enumerate(self.parameters.minterpy_point_list): # Shift the atoms in negative direction of the point(s) we actually @@ -166,7 +168,7 @@ def _calculate(self, atoms, outdir, grid_dimensions, **kwargs): self.setup_lammps_tmp_files("minterpy", outdir) ase.io.write( - self.lammps_temporary_input, self.atoms, format=lammps_format + self._lammps_temporary_input, self._atoms, format=lammps_format ) # Create LAMMPS instance. diff --git a/mala/network/predictor.py b/mala/network/predictor.py index 785671dc0..440929906 100644 --- a/mala/network/predictor.py +++ b/mala/network/predictor.py @@ -139,7 +139,7 @@ def predict_for_atoms(self, atoms, gather_ldos=False, temperature=None): self.data.target_calculator.read_additional_calculation_data( [atoms, self.data.grid_dimension], "atoms+grid" ) - feature_length = self.data.descriptor_calculator.fingerprint_length + feature_length = self.data.descriptor_calculator.feature_size # The actual calculation of the LDOS from the descriptors depends # on whether we run in parallel or serial. In the former case, diff --git a/test/all_lazy_loading_test.py b/test/all_lazy_loading_test.py index 4e7661bff..5130266a7 100644 --- a/test/all_lazy_loading_test.py +++ b/test/all_lazy_loading_test.py @@ -110,34 +110,34 @@ def test_scaling(self): # I presume to be due to numerical constraints. To make a # meaningful comparison it is wise to scale the value here. this_result.append( - data_handler.input_data_scaler._total_mean + data_handler.input_data_scaler.total_mean / data_handler.nr_training_data ) this_result.append( - data_handler.input_data_scaler._total_std + data_handler.input_data_scaler.total_std / data_handler.nr_training_data ) this_result.append( - data_handler.output_data_scaler._total_mean + data_handler.output_data_scaler.total_mean / data_handler.nr_training_data ) this_result.append( - data_handler.output_data_scaler._total_std + data_handler.output_data_scaler.total_std / data_handler.nr_training_data ) elif scalingtype == "normal": torch.manual_seed(2002) this_result.append( - data_handler.input_data_scaler._total_max + data_handler.input_data_scaler.total_max ) this_result.append( - data_handler.input_data_scaler._total_min + data_handler.input_data_scaler.total_min ) this_result.append( - data_handler.output_data_scaler._total_max + data_handler.output_data_scaler.total_max ) this_result.append( - data_handler.output_data_scaler._total_min + data_handler.output_data_scaler.total_min ) dataset_tester.append( (data_handler.training_data_sets[0][3998])[0].sum() @@ -165,41 +165,41 @@ def test_scaling(self): # I presume to be due to numerical constraints. To make a # meaningful comparison it is wise to scale the value here. 
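For context, the scaler statistics compared in these tests become ordinary public attributes once the data has been prepared. A minimal sketch, assuming snapshot files exist at the (purely illustrative) paths below and that "standard" rescaling is configured; the rescaling parameter names follow typical MALA usage and are not taken verbatim from this patch:

import mala

parameters = mala.Parameters()
parameters.data.input_rescaling_type = "standard"
parameters.data.output_rescaling_type = "standard"

data_handler = mala.DataHandler(parameters)
data_handler.add_snapshot(
    "Be_snapshot0.in.npy", "/path/to/data",
    "Be_snapshot0.out.npy", "/path/to/data", "tr",
)
data_handler.add_snapshot(
    "Be_snapshot1.in.npy", "/path/to/data",
    "Be_snapshot1.out.npy", "/path/to/data", "va",
)
data_handler.prepare_data()

# Mean and standard deviation gathered during input scaling are now
# accessible without the leading underscore.
print(data_handler.input_data_scaler.total_mean)
print(data_handler.input_data_scaler.total_std)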
this_result.append( - torch.mean(data_handler.input_data_scaler._means) + torch.mean(data_handler.input_data_scaler.means) / data_handler.parameters.snapshot_directories_list[ 0 ].grid_size ) this_result.append( - torch.mean(data_handler.input_data_scaler._stds) + torch.mean(data_handler.input_data_scaler.stds) / data_handler.parameters.snapshot_directories_list[ 0 ].grid_size ) this_result.append( - torch.mean(data_handler.output_data_scaler._means) + torch.mean(data_handler.output_data_scaler.means) / data_handler.parameters.snapshot_directories_list[ 0 ].grid_size ) this_result.append( - torch.mean(data_handler.output_data_scaler._stds) + torch.mean(data_handler.output_data_scaler.stds) / data_handler.parameters.snapshot_directories_list[ 0 ].grid_size ) elif scalingtype == "feature-wise-normal": this_result.append( - torch.mean(data_handler.input_data_scaler._maxs) + torch.mean(data_handler.input_data_scaler.maxs) ) this_result.append( - torch.mean(data_handler.input_data_scaler._mins) + torch.mean(data_handler.input_data_scaler.mins) ) this_result.append( - torch.mean(data_handler.output_data_scaler._maxs) + torch.mean(data_handler.output_data_scaler.maxs) ) this_result.append( - torch.mean(data_handler.output_data_scaler._mins) + torch.mean(data_handler.output_data_scaler.mins) ) comparison.append(this_result) diff --git a/test/complete_interfaces_test.py b/test/complete_interfaces_test.py index 4ceb691d8..300d6302f 100644 --- a/test/complete_interfaces_test.py +++ b/test/complete_interfaces_test.py @@ -117,7 +117,7 @@ def test_convert_numpy_openpmd(self): descriptor_save_path="./", target_save_path="./", additional_info_save_path="./", - naming_scheme="converted_from_numpy_*.bp5", + naming_scheme="converted_from_numpy_*.h5", descriptor_calculation_kwargs={"working_directory": "./"}, ) @@ -128,11 +128,13 @@ def test_convert_numpy_openpmd(self): for snapshot in range(2): data_converter.add_snapshot( descriptor_input_type="openpmd", - descriptor_input_path="converted_from_numpy_{}.in.bp5".format( + descriptor_input_path="converted_from_numpy_{}.in.h5".format( snapshot ), target_input_type="openpmd", - target_input_path="converted_from_numpy_{}.out.bp5".format(snapshot), + target_input_path="converted_from_numpy_{}.out.h5".format( + snapshot + ), additional_info_input_type=None, additional_info_input_path=None, target_units=None, @@ -151,8 +153,10 @@ def test_convert_numpy_openpmd(self): original = os.path.join( data_path, "Be_snapshot{}.{}.npy".format(snapshot, i_o) ) - roundtrip = "verify_against_original_numpy_data_{}.{}.npy".format( - snapshot, i_o + roundtrip = ( + "verify_against_original_numpy_data_{}.{}.npy".format( + snapshot, i_o + ) ) import numpy as np From 3d8db6ddfc8f68be4d59ed38cf2c3c1a66422f74 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Mon, 25 Nov 2024 15:56:12 +0100 Subject: [PATCH 12/21] Finished hyperparameter optimization classes --- mala/interfaces/ase_calculator.py | 51 ++++++-- mala/network/acsd_analyzer.py | 108 ++++++++-------- mala/network/hyper_opt.py | 20 +-- mala/network/hyper_opt_naswot.py | 174 +++++++++++++++----------- mala/network/hyper_opt_oat.py | 197 +++++++++++++++++------------- mala/network/hyper_opt_optuna.py | 29 ++++- test/complete_interfaces_test.py | 2 +- test/hyperopt_test.py | 2 +- test/inference_test.py | 4 +- 9 files changed, 349 insertions(+), 238 deletions(-) diff --git a/mala/interfaces/ase_calculator.py b/mala/interfaces/ase_calculator.py index 1ccd73d3a..941f36b7f 100644 --- a/mala/interfaces/ase_calculator.py +++ 
b/mala/interfaces/ase_calculator.py @@ -34,9 +34,24 @@ class MALA(Calculator): the neural network), calculator can access all important data such as temperature, number of electrons, etc. that might not be known simply from the atomic positions. + + predictor : mala.network.predictor.Predictor + A Predictor class object to be used for the underlying MALA + predictions. + + Attributes + ---------- + mala_parameters : mala.common.parameters.Parameters + MALA parameters used for predictions. + + last_energy_contributions : dict + Contains all total energy contributions for the last prediction. + + implemented_properties : list + List of which properties can be computed by this calculator. """ - implemented_properties = ["energy", "forces"] + implemented_properties = ["energy"] def __init__( self, @@ -55,21 +70,21 @@ def __init__( "The MALA calculator currently only works with the LDOS." ) - self.network: Network = network - self.data_handler: DataHandler = data + self._network: Network = network + self._data_handler: DataHandler = data # Prepare for prediction. if predictor is None: - self.predictor = Predictor( - self.mala_parameters, self.network, self.data_handler + self._predictor = Predictor( + self.mala_parameters, self._network, self._data_handler ) else: - self.predictor = predictor + self._predictor = predictor if reference_data is not None: # Get critical values from a reference file (cutoff, # temperature, etc.) - self.data_handler.target_calculator.read_additional_calculation_data( + self._data_handler.target_calculator.read_additional_calculation_data( reference_data ) @@ -91,6 +106,11 @@ def load_model(cls, run_name, path="./"): path : str Path where the model is saved. + + Returns + ------- + calculator : mala.interfaces.calculator.Calculator + The calculator object. """ parallel_warn( "MALA.load_model() will be deprecated in MALA v1.4.0." @@ -115,6 +135,11 @@ def load_run(cls, run_name, path="./"): path : str Path where the model is saved. + + Returns + ------- + calculator : mala.interfaces.calculator.Calculator + The calculator object. """ loaded_params, loaded_network, new_datahandler, loaded_runner = ( Predictor.load_run(run_name, path=path) @@ -152,10 +177,10 @@ def calculate( Calculator.calculate(self, atoms, properties, system_changes) # Get the LDOS from the NN. - ldos = self.predictor.predict_for_atoms(atoms) + ldos = self._predictor.predict_for_atoms(atoms) # Use the LDOS determined DOS and density to get energy and forces. 
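A rough usage sketch for this calculator from the ASE side; the run name, paths and structure file are placeholders, and a previously trained and saved MALA model is assumed to exist:

from ase.io import read

from mala.interfaces.ase_calculator import MALA

# Load a previously saved MALA model; "be_model" and the paths are
# placeholders for an actual trained run.
calculator = MALA.load_run("be_model", path="/path/to/model")

# Attach the calculator to an ASE atoms object, here read from a
# Quantum ESPRESSO output file.
atoms = read("/path/to/Be_snapshot1.out", format="espresso-out")
atoms.calc = calculator

# "energy" is the only implemented property; the individual energy
# contributions of the last prediction remain accessible afterwards.
print(atoms.get_potential_energy())
print(calculator.last_energy_contributions)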
- ldos_calculator: LDOS = self.data_handler.target_calculator + ldos_calculator: LDOS = self._data_handler.target_calculator ldos_calculator.read_from_array(ldos) self.results["energy"] = ldos_calculator.total_energy energy, self.last_energy_contributions = ( @@ -197,19 +222,19 @@ def calculate_properties(self, atoms, properties): if "rdf" in properties: self.results["rdf"] = ( - self.data_handler.target_calculator.get_radial_distribution_function( + self._data_handler.target_calculator.get_radial_distribution_function( atoms ) ) if "tpcf" in properties: self.results["tpcf"] = ( - self.data_handler.target_calculator.get_three_particle_correlation_function( + self._data_handler.target_calculator.get_three_particle_correlation_function( atoms ) ) if "static_structure_factor" in properties: self.results["static_structure_factor"] = ( - self.data_handler.target_calculator.get_static_structure_factor( + self._data_handler.target_calculator.get_static_structure_factor( atoms ) ) @@ -233,6 +258,6 @@ def save_calculator(self, filename, path="./"): Path where the calculator should be saved. """ - self.predictor.save_run( + self._predictor.save_run( filename, path=path, additional_calculation_data=True ) diff --git a/mala/network/acsd_analyzer.py b/mala/network/acsd_analyzer.py index b9bcba60a..317a425f1 100644 --- a/mala/network/acsd_analyzer.py +++ b/mala/network/acsd_analyzer.py @@ -49,16 +49,18 @@ def __init__( ): super(ACSDAnalyzer, self).__init__(params) # Calculators used to parse data from compatible files. - self.target_calculator = target_calculator - if self.target_calculator is None: - self.target_calculator = Target(params) - self.descriptor_calculator = descriptor_calculator - if self.descriptor_calculator is None: - self.descriptor_calculator = Descriptor(params) + self._target_calculator = target_calculator + if self._target_calculator is None: + self._target_calculator = Target(params) + self._descriptor_calculator = descriptor_calculator + if self._descriptor_calculator is None: + self._descriptor_calculator = Descriptor(params) if ( - not isinstance(self.descriptor_calculator, Bispectrum) - and not isinstance(self.descriptor_calculator, AtomicDensity) - and not isinstance(self.descriptor_calculator, MinterpyDescriptors) + not isinstance(self._descriptor_calculator, Bispectrum) + and not isinstance(self._descriptor_calculator, AtomicDensity) + and not isinstance( + self._descriptor_calculator, MinterpyDescriptors + ) ): raise Exception( "Cannot calculate ACSD for the selected descriptors." @@ -70,10 +72,10 @@ def __init__( self.__snapshot_units = [] # Filled after the analysis. - self.labels = [] - self.study = [] - self.reduced_study = None - self.internal_hyperparam_list = None + self._labels = [] + self._study = [] + self._reduced_study = None + self._internal_hyperparam_list = None def add_snapshot( self, @@ -189,7 +191,7 @@ def perform_study( # Prepare the hyperparameter lists. self._construct_hyperparam_list() hyperparameter_tuples = list( - itertools.product(*self.internal_hyperparam_list) + itertools.product(*self._internal_hyperparam_list) ) # Perform the ACSD analysis separately for each snapshot. 
@@ -208,14 +210,14 @@ def perform_study( ) for idx, hyperparameter_tuple in enumerate(hyperparameter_tuples): - if isinstance(self.descriptor_calculator, Bispectrum): + if isinstance(self._descriptor_calculator, Bispectrum): self.params.descriptors.bispectrum_cutoff = ( hyperparameter_tuple[0] ) self.params.descriptors.bispectrum_twojmax = ( hyperparameter_tuple[1] ) - elif isinstance(self.descriptor_calculator, AtomicDensity): + elif isinstance(self._descriptor_calculator, AtomicDensity): self.params.descriptors.atomic_density_cutoff = ( hyperparameter_tuple[0] ) @@ -223,7 +225,7 @@ def perform_study( hyperparameter_tuple[1] ) elif isinstance( - self.descriptor_calculator, MinterpyDescriptors + self._descriptor_calculator, MinterpyDescriptors ): self.params.descriptors.atomic_density_cutoff = ( hyperparameter_tuple[0] @@ -269,11 +271,11 @@ def perform_study( ) outstring = "[" - for label_id, label in enumerate(self.labels): + for label_id, label in enumerate(self._labels): outstring += ( label + ": " + str(hyperparameter_tuple[label_id]) ) - if label_id < len(self.labels) - 1: + if label_id < len(self._labels) - 1: outstring += ", " outstring += "]" best_trial_string = ". No suitable trial found yet." @@ -295,34 +297,34 @@ def perform_study( ) if get_rank() == 0: - self.study.append(current_list) + self._study.append(current_list) if get_rank() == 0: - self.study = np.mean(self.study, axis=0) + self._study = np.mean(self._study, axis=0) # TODO: Does this even make sense for the minterpy descriptors? if return_plotting: results_to_plot = [] - if len(self.internal_hyperparam_list) == 2: - len_first_dim = len(self.internal_hyperparam_list[0]) - len_second_dim = len(self.internal_hyperparam_list[1]) + if len(self._internal_hyperparam_list) == 2: + len_first_dim = len(self._internal_hyperparam_list[0]) + len_second_dim = len(self._internal_hyperparam_list[1]) for i in range(0, len_first_dim): results_to_plot.append( - self.study[ + self._study[ i * len_second_dim : (i + 1) * len_second_dim, 2:, ] ) - if isinstance(self.descriptor_calculator, Bispectrum): + if isinstance(self._descriptor_calculator, Bispectrum): return results_to_plot, { - "twojmax": self.internal_hyperparam_list[1], - "cutoff": self.internal_hyperparam_list[0], + "twojmax": self._internal_hyperparam_list[1], + "cutoff": self._internal_hyperparam_list[0], } - if isinstance(self.descriptor_calculator, AtomicDensity): + if isinstance(self._descriptor_calculator, AtomicDensity): return results_to_plot, { - "sigma": self.internal_hyperparam_list[1], - "cutoff": self.internal_hyperparam_list[0], + "sigma": self._internal_hyperparam_list[1], + "cutoff": self._internal_hyperparam_list[0], } def set_optimal_parameters(self): @@ -333,9 +335,9 @@ def set_optimal_parameters(self): hyperparameter optimizer was created. 
""" if get_rank() == 0: - minimum_acsd = self.study[np.argmin(self.study[:, -1])] - if len(self.internal_hyperparam_list) == 2: - if isinstance(self.descriptor_calculator, Bispectrum): + minimum_acsd = self._study[np.argmin(self._study[:, -1])] + if len(self._internal_hyperparam_list) == 2: + if isinstance(self._descriptor_calculator, Bispectrum): self.params.descriptors.bispectrum_cutoff = minimum_acsd[0] self.params.descriptors.bispectrum_twojmax = int( minimum_acsd[1] @@ -351,7 +353,7 @@ def set_optimal_parameters(self): "Bispectrum cutoff: ", self.params.descriptors.bispectrum_cutoff, ) - if isinstance(self.descriptor_calculator, AtomicDensity): + if isinstance(self._descriptor_calculator, AtomicDensity): self.params.descriptors.atomic_density_cutoff = ( minimum_acsd[0] ) @@ -369,8 +371,10 @@ def set_optimal_parameters(self): "Atomic density cutoff: ", self.params.descriptors.atomic_density_cutoff, ) - elif len(self.internal_hyperparam_list) == 5: - if isinstance(self.descriptor_calculator, MinterpyDescriptors): + elif len(self._internal_hyperparam_list) == 5: + if isinstance( + self._descriptor_calculator, MinterpyDescriptors + ): self.params.descriptors.atomic_density_cutoff = ( minimum_acsd[0] ) @@ -411,7 +415,7 @@ def set_optimal_parameters(self): ) def _construct_hyperparam_list(self): - if isinstance(self.descriptor_calculator, Bispectrum): + if isinstance(self._descriptor_calculator, Bispectrum): if ( list( map( @@ -452,10 +456,10 @@ def _construct_hyperparam_list(self): ).index(True) ].choices - self.internal_hyperparam_list = [first_dim_list, second_dim_list] - self.labels = ["cutoff", "twojmax"] + self._internal_hyperparam_list = [first_dim_list, second_dim_list] + self._labels = ["cutoff", "twojmax"] - elif isinstance(self.descriptor_calculator, AtomicDensity): + elif isinstance(self._descriptor_calculator, AtomicDensity): if ( list( map( @@ -499,10 +503,10 @@ def _construct_hyperparam_list(self): ) ).index(True) ].choices - self.internal_hyperparam_list = [first_dim_list, second_dim_list] - self.labels = ["cutoff", "sigma"] + self._internal_hyperparam_list = [first_dim_list, second_dim_list] + self._labels = ["cutoff", "sigma"] - elif isinstance(self.descriptor_calculator, MinterpyDescriptors): + elif isinstance(self._descriptor_calculator, MinterpyDescriptors): if ( list( map( @@ -611,14 +615,14 @@ def _construct_hyperparam_list(self): ).index(True) ].choices - self.internal_hyperparam_list = [ + self._internal_hyperparam_list = [ first_dim_list, second_dim_list, third_dim_list, fourth_dim_list, fifth_dim_list, ] - self.labels = [ + self._labels = [ "cutoff", "sigma", "minterpy_cutoff", @@ -638,7 +642,7 @@ def _calculate_descriptors(self, snapshot, description, original_units): if description["input"] == "espresso-out": descriptor_calculation_kwargs["units"] = original_units["input"] tmp_input, local_size = ( - self.descriptor_calculator.calculate_from_qe_out( + self._descriptor_calculator.calculate_from_qe_out( snapshot["input"], **descriptor_calculation_kwargs ) ) @@ -652,7 +656,7 @@ def _calculate_descriptors(self, snapshot, description, original_units): "Unknown file extension, cannot convert descriptor" ) if self.params.descriptors._configuration["mpi"]: - tmp_input = self.descriptor_calculator.gather_descriptors( + tmp_input = self._descriptor_calculator.gather_descriptors( tmp_input ) @@ -676,7 +680,7 @@ def _load_target( target_calculator_kwargs["units"] = original_units["output"] target_calculator_kwargs["use_memmap"] = memmap # If no units are provided we just 
assume standard units. - tmp_output = self.target_calculator.read_from_cube( + tmp_output = self._target_calculator.read_from_cube( snapshot["output"], **target_calculator_kwargs ) @@ -684,19 +688,19 @@ def _load_target( target_calculator_kwargs["units"] = original_units["output"] target_calculator_kwargs["use_memmap"] = memmap # If no units are provided we just assume standard units. - tmp_output = self.target_calculator.read_from_xsf( + tmp_output = self._target_calculator.read_from_xsf( snapshot["output"], **target_calculator_kwargs ) elif description["output"] == "numpy": if get_rank() == 0: - tmp_output = self.target_calculator.read_from_numpy_file( + tmp_output = self._target_calculator.read_from_numpy_file( snapshot["output"], units=original_units["output"] ) elif description["output"] == "openpmd": if get_rank() == 0: - tmp_output = self.target_calculator.read_from_numpy_file( + tmp_output = self._target_calculator.read_from_numpy_file( snapshot["output"], units=original_units["output"] ) else: diff --git a/mala/network/hyper_opt.py b/mala/network/hyper_opt.py index c26e93a81..2311c2ad1 100644 --- a/mala/network/hyper_opt.py +++ b/mala/network/hyper_opt.py @@ -24,6 +24,11 @@ class HyperOpt(ABC): use_pkl_checkpoints : bool If true, .pkl checkpoints will be created. + + Attributes + ---------- + params : mala.common.parametes.Parameters + MALA Parameters object. """ def __new__(cls, params: Parameters, data=None, use_pkl_checkpoints=False): @@ -73,9 +78,9 @@ def __init__( self, params: Parameters, data=None, use_pkl_checkpoints=False ): self.params: Parameters = params - self.data_handler = data - self.objective = ObjectiveBase(self.params, self.data_handler) - self.use_pkl_checkpoints = use_pkl_checkpoints + self._data_handler = data + self._objective = ObjectiveBase(self.params, self._data_handler) + self._use_pkl_checkpoints = use_pkl_checkpoints def add_hyperparameter( self, opttype="float", name="", low=0, high=0, choices=None @@ -153,7 +158,7 @@ def set_parameters(self, trial): The parameters will be written to the parameter object with which the hyperparameter optimizer was created. """ - self.objective.parse_trial(trial) + self._objective.parse_trial(trial) def _save_params_and_scaler(self): # Saving the Scalers is straight forward. @@ -163,12 +168,12 @@ def _save_params_and_scaler(self): oscaler_name = ( self.params.hyperparameters.checkpoint_name + "_oscaler.pkl" ) - self.data_handler.input_data_scaler.save(iscaler_name) - self.data_handler.output_data_scaler.save(oscaler_name) + self._data_handler.input_data_scaler.save(iscaler_name) + self._data_handler.output_data_scaler.save(oscaler_name) # For the parameters we have to make sure we choose the correct # format. - if self.use_pkl_checkpoints: + if self._use_pkl_checkpoints: param_name = ( self.params.hyperparameters.checkpoint_name + "_params.pkl" ) @@ -198,7 +203,6 @@ def checkpoint_exists(cls, checkpoint_name, use_pkl_checkpoints=False): ------- checkpoint_exists : bool True if the checkpoint exists, False otherwise. 
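As a usage sketch of this interface together with one of the concrete optimizers (hyperparameter names and choices are illustrative only, and a Parameters object plus a prepared DataHandler are assumed):

import mala
from mala.network.hyper_opt_naswot import HyperOptNASWOT

parameters = mala.Parameters()
data_handler = mala.DataHandler(parameters)
# ... add training/validation snapshots and call prepare_data() here ...

hyperoptimizer = HyperOptNASWOT(parameters, data_handler)
hyperoptimizer.add_hyperparameter(
    "categorical", "ff_neurons_layer_001", choices=[32, 64, 128]
)
hyperoptimizer.add_hyperparameter(
    "categorical", "layer_activation_001", choices=["ReLU", "Sigmoid"]
)

# Without an explicit trial list, all combinations of the hyperparameters
# above are evaluated and the loss of the best trial is returned.
best_loss = hyperoptimizer.perform_study()
hyperoptimizer.set_optimal_parameters()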
- """ iscaler_name = checkpoint_name + "_iscaler.pkl" oscaler_name = checkpoint_name + "_oscaler.pkl" diff --git a/mala/network/hyper_opt_naswot.py b/mala/network/hyper_opt_naswot.py index 9a11e1ca0..0d57bedbf 100644 --- a/mala/network/hyper_opt_naswot.py +++ b/mala/network/hyper_opt_naswot.py @@ -2,8 +2,9 @@ import itertools -import optuna +from functools import cached_property import numpy as np +import optuna from mala.common.parallelizer import ( printout, @@ -11,6 +12,7 @@ get_size, get_comm, barrier, + parallel_warn, ) from mala.network.hyper_opt import HyperOpt from mala.network.objective_naswot import ObjectiveNASWOT @@ -33,11 +35,10 @@ class HyperOptNASWOT(HyperOpt): def __init__(self, params, data): super(HyperOptNASWOT, self).__init__(params, data) - self.objective = None - self.trial_losses = None - self.best_trial = None - self.trial_list = None - self.ignored_hyperparameters = [ + self._objective = None + self._trial_losses = None + self._trial_list = None + self._ignored_hyperparameters = [ "learning_rate", "optimizer", "mini_batch_size", @@ -47,8 +48,68 @@ def __init__(self, params, data): ] # For parallelization. - self.first_trial = None - self.last_trial = None + self._first_trial = None + self._last_trial = None + + @property + def best_trial_index(self): + """ + Get the index and loss of best trial determined in this NASWOT run. + + This property is read only, and will be recomputed. + + Returns + ------- + best_trial_index : list + A list containing [0] the best trial index and [1] the best + trial loss. + """ + if self._trial_losses is None: + parallel_warn( + "Trial list is not yet computed, cannot determine " + "best trial." + ) + return [-1, np.inf] + + if self.params.use_mpi: + comm = get_comm() + local_result = np.array( + [ + float(np.argmax(self._trial_losses) + self._first_trial), + np.max(self._trial_losses), + ] + ) + all_results = comm.allgather(local_result) + max_on_node = np.argmax(np.array(all_results)[:, 1]) + return [ + int(all_results[max_on_node][0]), + all_results[max_on_node][1], + ] + else: + return [np.argmax(self._trial_losses), np.max(self._trial_losses)] + + @best_trial_index.setter + def best_trial_index(self, value): + pass + + @property + def best_trial(self): + """ + Get the best trial determined in this NASWOT run. + + This property is read only, and will be recomputed. + """ + if self._trial_losses is None: + parallel_warn( + "Trial list is not yet computed, cannot determine " + "best trial." + ) + return None + return self._trial_list[self.best_trial_index[0]] + + @best_trial.setter + def best_trial(self, value): + pass def perform_study(self, trial_list=None): """ @@ -62,6 +123,11 @@ def perform_study(self, trial_list=None): ---------- trial_list : list A list containing trials from either HyperOptOptuna or HyperOptOAT. + + Returns + ------- + best_trial_loss : float + Loss of the best trial. """ # The minibatch size can not vary in the analysis. # This check ensures that e.g. optuna results can be used. @@ -76,29 +142,29 @@ def perform_study(self, trial_list=None): # Ideally, this type of HO is called with a list of trials for which # the parameter has to be identified. - self.trial_list = trial_list - if self.trial_list is None: + self._trial_list = trial_list + if self._trial_list is None: printout( "No trial list provided, one will be created using all " "possible permutations of hyperparameters. 
" "The following hyperparameters will be ignored:", min_verbosity=0, ) - printout(self.ignored_hyperparameters) + printout(self._ignored_hyperparameters) # Please note for the parallel case: The trial list returned # here is deterministic. - self.trial_list = self.__all_combinations() + self._trial_list = self.__all_combinations() if self.params.use_mpi: trials_per_rank = int( - np.floor((len(self.trial_list) / get_size())) + np.floor((len(self._trial_list) / get_size())) ) - self.first_trial = get_rank() * trials_per_rank - self.last_trial = (get_rank() + 1) * trials_per_rank + self._first_trial = get_rank() * trials_per_rank + self._last_trial = (get_rank() + 1) * trials_per_rank if get_size() == get_rank() + 1: - trials_per_rank += len(self.trial_list) % get_size() - self.last_trial += len(self.trial_list) % get_size() + trials_per_rank += len(self._trial_list) % get_size() + self._last_trial += len(self._trial_list) % get_size() # We currently do not support checkpointing in parallel mode # for performance reasons. @@ -109,78 +175,58 @@ def perform_study(self, trial_list=None): ) self.params.hyperparameters.checkpoints_each_trial = 0 else: - self.first_trial = 0 - self.last_trial = len(self.trial_list) + self._first_trial = 0 + self._last_trial = len(self._trial_list) # TODO: For now. Needs some refinements later. if isinstance( - self.trial_list[0], optuna.trial.FrozenTrial - ) or isinstance(self.trial_list[0], optuna.trial.FixedTrial): + self._trial_list[0], optuna.trial.FrozenTrial + ) or isinstance(self._trial_list[0], optuna.trial.FixedTrial): trial_type = "optuna" else: trial_type = "oat" - self.objective = ObjectiveNASWOT( - self.params, self.data_handler, trial_type + self._objective = ObjectiveNASWOT( + self.params, self._data_handler, trial_type ) printout( "Starting NASWOT hyperparameter optimization,", - len(self.trial_list), + len(self._trial_list), "trials will be performed.", min_verbosity=0, ) - self.trial_losses = [] + self._trial_losses = [] for idx, row in enumerate( - self.trial_list[self.first_trial : self.last_trial] + self._trial_list[self._first_trial : self._last_trial] ): - trial_loss = self.objective(row) - self.trial_losses.append(trial_loss) + trial_loss = self._objective(row) + self._trial_losses.append(trial_loss) # Output diagnostic information. if self.params.use_mpi: print( "Trial number", - idx + self.first_trial, + idx + self._first_trial, "finished with:", - self.trial_losses[idx], + self._trial_losses[idx], ) else: - best_trial = self.get_best_trial_results() printout( "Trial number", idx, "finished with:", - self.trial_losses[idx], + self._trial_losses[idx], ", best is trial", - best_trial[0], + self.best_trial_index[0], "with", - best_trial[1], + self.best_trial_index[1], min_verbosity=0, ) barrier() # Return the best loss value we could achieve. 
-        return self.get_best_trial_results()[1]
-
-    def get_best_trial_results(self):
-        """Get the best trial out of the list, including the value."""
-        if self.params.use_mpi:
-            comm = get_comm()
-            local_result = np.array(
-                [
-                    float(np.argmax(self.trial_losses) + self.first_trial),
-                    np.max(self.trial_losses),
-                ]
-            )
-            all_results = comm.allgather(local_result)
-            max_on_node = np.argmax(np.array(all_results)[:, 1])
-            return [
-                int(all_results[max_on_node][0]),
-                all_results[max_on_node][1],
-            ]
-        else:
-            return [np.argmax(self.trial_losses), np.max(self.trial_losses)]
+        return self.best_trial_index[1]
 
     def set_optimal_parameters(self):
         """
@@ -189,29 +235,13 @@ def set_optimal_parameters(self):
         The parameters will be written to the parameter object with which
         the hyperparameter optimizer was created.
         """
-        # Getting the best trial based on the test errors
-        if self.params.use_mpi:
-            comm = get_comm()
-            local_result = np.array(
-                [
-                    float(np.argmax(self.trial_losses) + self.first_trial),
-                    np.max(self.trial_losses),
-                ]
-            )
-            all_results = comm.allgather(local_result)
-            max_on_node = np.argmax(np.array(all_results)[:, 1])
-            idx = int(all_results[max_on_node][0])
-        else:
-            idx = self.trial_losses.index(max(self.trial_losses))
-
-        self.best_trial = self.trial_list[idx]
-        self.objective.parse_trial(self.best_trial)
+        self._objective.parse_trial(self.best_trial)
 
     def __all_combinations(self):
         # First, remove all the hyperparameters we don't actually need.
         indices_to_remove = []
         for idx, par in enumerate(self.params.hyperparameters.hlist):
-            if par.name in self.ignored_hyperparameters:
+            if par.name in self._ignored_hyperparameters:
                 indices_to_remove.append(idx)
         for index in sorted(indices_to_remove, reverse=True):
             del self.params.hyperparameters.hlist[index]
diff --git a/mala/network/hyper_opt_oat.py b/mala/network/hyper_opt_oat.py
index 674cbed6f..4642320db 100644
--- a/mala/network/hyper_opt_oat.py
+++ b/mala/network/hyper_opt_oat.py
@@ -14,7 +14,7 @@
 from mala.network.hyper_opt import HyperOpt
 from mala.network.objective_base import ObjectiveBase
 from mala.network.hyperparameter_oat import HyperparameterOAT
-from mala.common.parallelizer import printout
+from mala.common.parallelizer import printout, parallel_warn
 
 
 class HyperOptOAT(HyperOpt):
@@ -38,22 +38,55 @@ def __init__(self, params, data, use_pkl_checkpoints=False):
         super(HyperOptOAT, self).__init__(
             params, data, use_pkl_checkpoints=use_pkl_checkpoints
         )
-        self.objective = None
-        self.optimal_params = None
-        self.checkpoint_counter = 0
+        self._objective = None
+        self._optimal_params = None
+        self._checkpoint_counter = 0
 
         # Related to the OA itself.
-        self.importance = None
-        self.n_factors = None
-        self.factor_levels = None
-        self.strength = None
-        self.N_runs = None
+        self._importance = None
+        self._n_factors = None
+        self._factor_levels = None
+        self._strength = None
+        self._N_runs = None
         self.__OA = None
 
         # Tracking the trial progress.
-        self.sorted_num_choices = []
-        self.current_trial = 0
-        self.trial_losses = None
+        self._sorted_num_choices = []
+        self._current_trial = 0
+        self._trial_losses = None
+
+    @property
+    def best_trial_index(self):
+        """
+        Get the index and loss of best trial determined in this OAT run.
+
+        This property is read only, and will be recomputed.
+
+        Returns
+        -------
+        best_trial_index : list
+            A list containing [0] the best trial index and [1] the best
+            trial loss.
+        """
+        if self._trial_losses is None:
+            parallel_warn(
+                "Trial list is not yet computed, cannot determine "
+                "best trial."
+ ) + return [-1, np.inf] + + if self.params.hyperparameters.direction == "minimize": + return [np.argmin(self._trial_losses), np.min(self._trial_losses)] + elif self.params.hyperparameters.direction == "maximize": + return [np.argmax(self._trial_losses), np.max(self._trial_losses)] + else: + raise Exception( + "Invalid direction for hyperparameter optimization selected." + ) + + @best_trial_index.setter + def best_trial_index(self, value): + pass def add_hyperparameter( self, opttype="categorical", name="", choices=None, **kwargs @@ -70,15 +103,15 @@ def add_hyperparameter( Datatype of the hyperparameter. Follows optuna's naming conventions, but currently only supports "categorical" (a list). """ - if not self.sorted_num_choices: # if empty + if not self._sorted_num_choices: # if empty super(HyperOptOAT, self).add_hyperparameter( opttype=opttype, name=name, choices=choices ) - self.sorted_num_choices.append(len(choices)) + self._sorted_num_choices.append(len(choices)) else: - index = bisect(self.sorted_num_choices, len(choices)) - self.sorted_num_choices.insert(index, len(choices)) + index = bisect(self._sorted_num_choices, len(choices)) + self._sorted_num_choices.insert(index, len(choices)) self.params.hyperparameters.hlist.insert( index, HyperparameterOAT(opttype=opttype, name=name, choices=choices), @@ -88,50 +121,50 @@ def perform_study(self): """ Perform the study, i.e. the optimization. - Uses Optunas TPE sampler. + Internally constructs an orthogonal array and performs trial NN + trainings based on it. """ if self.__OA is None: - self.__OA = self.get_orthogonal_array() + self.__OA = self._get_orthogonal_array() print(self.__OA) - if self.trial_losses is None: - self.trial_losses = np.zeros(self.__OA.shape[0]) + float("inf") + if self._trial_losses is None: + self._trial_losses = np.zeros(self.__OA.shape[0]) + float("inf") printout( "Performing", - self.N_runs, + self._N_runs, "trials, starting with trial number", - self.current_trial, + self._current_trial, min_verbosity=0, ) # The parameters could have changed. - self.objective = ObjectiveBase(self.params, self.data_handler) + self._objective = ObjectiveBase(self.params, self._data_handler) # Iterate over the OA and perform the trials. - for i in range(self.current_trial, self.N_runs): + for i in range(self._current_trial, self._N_runs): row = self.__OA[i] - self.trial_losses[self.current_trial] = self.objective(row) + self._trial_losses[self._current_trial] = self._objective(row) # Output diagnostic information. - best_trial = self.get_best_trial_results() printout( "Trial number", - self.current_trial, + self._current_trial, "finished with:", - self.trial_losses[self.current_trial], + self._trial_losses[self._current_trial], ", best is trial", - best_trial[0], + self.best_trial_index[0], "with", - best_trial[1], + self.best_trial_index[1], min_verbosity=0, ) - self.current_trial += 1 + self._current_trial += 1 self.__create_checkpointing(row) # Perform Range Analysis - self.get_optimal_parameters() + self._range_analysis() - def get_optimal_parameters(self): + def _range_analysis(self): """ Find the optimal set of hyperparameters by doing range analysis. 
@@ -143,15 +176,15 @@ def indices(idx, val): return np.where(self.__OA[:, idx] == val)[0] R = [ - [self.trial_losses[indices(idx, l)].sum() for l in range(levels)] - for (idx, levels) in enumerate(self.factor_levels) + [self._trial_losses[indices(idx, l)].sum() for l in range(levels)] + for (idx, levels) in enumerate(self._factor_levels) ] A = [[i / len(j) for i in j] for j in R] # Taking loss as objective to minimise - self.optimal_params = np.array([i.index(min(i)) for i in A]) - self.importance = np.argsort([max(i) - min(i) for i in A]) + self._optimal_params = np.array([i.index(min(i)) for i in A]) + self._importance = np.argsort([max(i) - min(i) for i in A]) def show_order_of_importance(self): """Print the order of importance of the hyperparameters.""" @@ -159,7 +192,7 @@ def show_order_of_importance(self): printout( *[ self.params.hyperparameters.hlist[idx].name - for idx in self.importance + for idx in self._importance ], sep=" < ", min_verbosity=0 @@ -172,23 +205,23 @@ def set_optimal_parameters(self): The parameters will be written to the parameter object with which the hyperparameter optimizer was created. """ - self.objective.parse_trial_oat(self.optimal_params) + self._objective.parse_trial_oat(self._optimal_params) - def get_orthogonal_array(self): + def _get_orthogonal_array(self): """ Generate the best OA used for optimal hyperparameter sampling. This is function is taken from the example notebook of OApackage. """ self.__check_factor_levels() - print("Sorted factor levels:", self.sorted_num_choices) - self.n_factors = len(self.params.hyperparameters.hlist) + print("Sorted factor levels:", self._sorted_num_choices) + self._n_factors = len(self.params.hyperparameters.hlist) - self.factor_levels = [ + self._factor_levels = [ par.num_choices for par in self.params.hyperparameters.hlist ] - self.strength = 2 + self._strength = 2 arraylist = None # This is a little bit hacky. @@ -200,11 +233,14 @@ def get_orthogonal_array(self): # holds. x is unknown, but we can be confident that it should be # small. So simply trying 3 time should be fine for now. for i in range(1, 4): - self.N_runs = self.number_of_runs() * i - print("Trying run size:", self.N_runs) + self._N_runs = self._number_of_runs() * i + print("Trying run size:", self._N_runs) print("Generating Suitable Orthogonal Array.") arrayclass = oa.arraydata_t( - self.factor_levels, self.N_runs, self.strength, self.n_factors + self._factor_levels, + self._N_runs, + self._strength, + self._n_factors, ) arraylist = [arrayclass.create_root()] @@ -212,7 +248,7 @@ def get_orthogonal_array(self): options = oa.OAextend() options.setAlgorithmAuto(arrayclass) - for _ in range(self.strength + 1, self.n_factors + 1): + for _ in range(self._strength + 1, self._n_factors + 1): arraylist_extensions = oa.extend_arraylist( arraylist, arrayclass, options ) @@ -231,7 +267,7 @@ def get_orthogonal_array(self): else: return np.unique(np.array(arraylist[0]), axis=0) - def number_of_runs(self): + def _number_of_runs(self): """ Calculate the minimum number of runs required for an Orthogonal array. 
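The run size computed below follows from the factor levels and the strength: the number of runs must be divisible by the product of the level counts of every combination of strength-many factors, so the least common multiple of those products is used. A small standalone illustration with made-up factor levels:

import itertools

import numpy as np

# Hypothetical factor levels for three hyperparameters (4, 3 and 2
# possible choices) and an orthogonal array of strength 2.
factor_levels = [4, 3, 2]
strength = 2

runs = [
    np.prod(tt) for tt in itertools.combinations(factor_levels, strength)
]
# The pairwise products are 12, 8 and 6; their least common multiple,
# and thus the minimum number of runs, is 24.
print(int(np.lcm.reduce(runs)))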
@@ -241,29 +277,20 @@ def number_of_runs(self): """ runs = [ np.prod(tt) - for tt in itertools.combinations(self.factor_levels, self.strength) + for tt in itertools.combinations( + self._factor_levels, self._strength + ) ] N = np.lcm.reduce(runs) return int(N) - def get_best_trial_results(self): - """Get the best trial out of the list, including the value.""" - if self.params.hyperparameters.direction == "minimize": - return [np.argmin(self.trial_losses), np.min(self.trial_losses)] - elif self.params.hyperparameters.direction == "maximize": - return [np.argmax(self.trial_losses), np.max(self.trial_losses)] - else: - raise Exception( - "Invalid direction for hyperparameter optimization selected." - ) - def __check_factor_levels(self): """Check that the factors are in a decreasing order.""" - dx = np.diff(self.sorted_num_choices) + dx = np.diff(self._sorted_num_choices) if np.all(dx >= 0): # Factors in increasing order, we have to reverse the order. - self.sorted_num_choices.reverse() + self._sorted_num_choices.reverse() self.params.hyperparameters.hlist.reverse() elif np.all(dx <= 0): # Factors are in decreasing order, we don't have to do anything. @@ -348,31 +375,33 @@ def load_from_file(cls, params, file_path, data): with open(file_path, "rb") as handle: loaded_tracking_data = pickle.load(handle) loaded_hyperopt = HyperOptOAT(params, data) - loaded_hyperopt.sorted_num_choices = loaded_tracking_data[ + loaded_hyperopt._sorted_num_choices = loaded_tracking_data[ "sorted_num_choices" ] - loaded_hyperopt.current_trial = loaded_tracking_data[ + loaded_hyperopt._current_trial = loaded_tracking_data[ "current_trial" ] - loaded_hyperopt.trial_losses = loaded_tracking_data["trial_losses"] - loaded_hyperopt.importance = loaded_tracking_data["importance"] - loaded_hyperopt.n_factors = loaded_tracking_data["n_factors"] - loaded_hyperopt.factor_levels = loaded_tracking_data[ + loaded_hyperopt._trial_losses = loaded_tracking_data[ + "trial_losses" + ] + loaded_hyperopt._importance = loaded_tracking_data["importance"] + loaded_hyperopt._n_factors = loaded_tracking_data["n_factors"] + loaded_hyperopt._factor_levels = loaded_tracking_data[ "factor_levels" ] - loaded_hyperopt.strength = loaded_tracking_data["strength"] - loaded_hyperopt.N_runs = loaded_tracking_data["N_runs"] + loaded_hyperopt._strength = loaded_tracking_data["strength"] + loaded_hyperopt._N_runs = loaded_tracking_data["N_runs"] loaded_hyperopt.__OA = loaded_tracking_data["OA"] return loaded_hyperopt def __create_checkpointing(self, trial): """Create a checkpoint of optuna study, if necessary.""" - self.checkpoint_counter += 1 + self._checkpoint_counter += 1 need_to_checkpoint = False if ( - self.checkpoint_counter + self._checkpoint_counter >= self.params.hyperparameters.checkpoints_each_trial and self.params.hyperparameters.checkpoints_each_trial > 0 ): @@ -386,12 +415,12 @@ def __create_checkpointing(self, trial): ) if ( self.params.hyperparameters.checkpoints_each_trial < 0 - and np.argmin(self.trial_losses) == self.current_trial - 1 + and np.argmin(self._trial_losses) == self._current_trial - 1 ): need_to_checkpoint = True printout( "Best trial is " - + str(self.current_trial - 1) + + str(self._current_trial - 1) + ", creating a " "checkpoint for it.", min_verbosity=1, @@ -399,7 +428,7 @@ def __create_checkpointing(self, trial): if need_to_checkpoint is True: # We need to create a checkpoint! 
- self.checkpoint_counter = 0 + self._checkpoint_counter = 0 self._save_params_and_scaler() @@ -411,14 +440,14 @@ def __create_checkpointing(self, trial): ) study = { - "sorted_num_choices": self.sorted_num_choices, - "current_trial": self.current_trial, - "trial_losses": self.trial_losses, - "importance": self.importance, - "n_factors": self.n_factors, - "factor_levels": self.factor_levels, - "strength": self.strength, - "N_runs": self.N_runs, + "sorted_num_choices": self._sorted_num_choices, + "current_trial": self._current_trial, + "trial_losses": self._trial_losses, + "importance": self._importance, + "n_factors": self._n_factors, + "factor_levels": self._factor_levels, + "strength": self._strength, + "N_runs": self._N_runs, "OA": self.__OA, } with open(hyperopt_name, "wb") as handle: diff --git a/mala/network/hyper_opt_optuna.py b/mala/network/hyper_opt_optuna.py index 10d9a21ea..623c7415c 100644 --- a/mala/network/hyper_opt_optuna.py +++ b/mala/network/hyper_opt_optuna.py @@ -25,6 +25,18 @@ class HyperOptOptuna(HyperOpt): use_pkl_checkpoints : bool If true, .pkl checkpoints will be created. + + Attributes + ---------- + params : mala.common.parameters.Parameters + MALA Parameters object. + + objective : mala.network.objective_base.ObjectiveBase + MALA objective to be optimized, i.e., a MALA NN model training. + + study : optuna.study.Study + An Optuna study used to collect the results of the hyperparameter + optimization. """ def __init__(self, params, data, use_pkl_checkpoints=False): @@ -93,7 +105,7 @@ def __init__(self, params, data, use_pkl_checkpoints=False): load_if_exists=True, pruner=pruner, ) - self.checkpoint_counter = 0 + self._checkpoint_counter = 0 def perform_study(self): """ @@ -101,9 +113,14 @@ def perform_study(self): This is done by sampling a certain subset of network architectures. In this case, optuna is used. + + Returns + ------- + best_trial_loss : float + Loss of the best trial. """ # The parameters could have changed. - self.objective = ObjectiveBase(self.params, self.data_handler) + self.objective = ObjectiveBase(self.params, self._data_handler) # Fill callback list based on user checkpoint wishes. callback_list = [self.__check_stopping] @@ -131,6 +148,8 @@ def get_trials_from_study(self): """ Return the trials from the last study. + Only returns completed trials. + Returns ------- last_trials: list @@ -350,11 +369,11 @@ def __check_stopping(self, study, trial): def __create_checkpointing(self, study, trial): """Create a checkpoint of optuna study, if necessary.""" - self.checkpoint_counter += 1 + self._checkpoint_counter += 1 need_to_checkpoint = False if ( - self.checkpoint_counter + self._checkpoint_counter >= self.params.hyperparameters.checkpoints_each_trial and self.params.hyperparameters.checkpoints_each_trial > 0 ): @@ -380,7 +399,7 @@ def __create_checkpointing(self, study, trial): if need_to_checkpoint is True: # We need to create a checkpoint! 
- self.checkpoint_counter = 0 + self._checkpoint_counter = 0 self._save_params_and_scaler() diff --git a/test/complete_interfaces_test.py b/test/complete_interfaces_test.py index 300d6302f..2d4831e4f 100644 --- a/test/complete_interfaces_test.py +++ b/test/complete_interfaces_test.py @@ -251,7 +251,7 @@ def test_ase_calculator(self): reference_data=os.path.join(data_path, "Be_snapshot1.out"), ) total_energy_dft_calculation = ( - calculator.data_handler.target_calculator.total_energy_dft_calculation + calculator._data_handler.target_calculator.total_energy_dft_calculation ) calculator.calculate(atoms, properties=["energy"]) assert np.isclose( diff --git a/test/hyperopt_test.py b/test/hyperopt_test.py index 77b0b9896..a04632035 100644 --- a/test/hyperopt_test.py +++ b/test/hyperopt_test.py @@ -294,7 +294,7 @@ def test_naswot_eigenvalues(self): for idx, trial in enumerate(correct_trial_list): assert np.isclose( trial, - test_hp_optimizer.trial_losses[idx], + test_hp_optimizer._trial_losses[idx], rtol=naswot_accuracy, ) diff --git a/test/inference_test.py b/test/inference_test.py index 84e0e9cca..956410cc7 100644 --- a/test/inference_test.py +++ b/test/inference_test.py @@ -33,7 +33,7 @@ def test_unit_conversion(self): # Confirm that unit conversion does not introduce any errors. - from_file_1 = data_handler.target_calculator.convert_units( + from_file_1 = data_handler._target_calculator.convert_units( np.load( os.path.join(data_path, "Be_snapshot" + str(0) + ".out.npy") ), @@ -41,7 +41,7 @@ def test_unit_conversion(self): ) from_file_2 = np.load( os.path.join(data_path, "Be_snapshot" + str(0) + ".out.npy") - ) * data_handler.target_calculator.convert_units( + ) * data_handler._target_calculator.convert_units( 1, in_units="1/(eV*Bohr^3)" ) From 9a351bccbaa976cb7d617f32ce179c67747cfbae Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Mon, 25 Nov 2024 17:03:40 +0100 Subject: [PATCH 13/21] Finished model and running classes --- examples/advanced/ex03_tensor_board.py | 12 +- mala/datahandling/fast_tensor_dataset.py | 1 - mala/network/hyperparameter.py | 31 ++- mala/network/network.py | 62 +++++- mala/network/objective_base.py | 57 +++--- mala/network/objective_naswot.py | 6 +- mala/network/predictor.py | 14 +- mala/network/runner.py | 14 ++ mala/network/tester.py | 34 +++- mala/network/trainer.py | 242 ++++++++++++----------- test/checkpoint_training_test.py | 4 +- test/inference_test.py | 4 +- 12 files changed, 304 insertions(+), 177 deletions(-) diff --git a/examples/advanced/ex03_tensor_board.py b/examples/advanced/ex03_tensor_board.py index 97bc781cf..b8e1bf16d 100644 --- a/examples/advanced/ex03_tensor_board.py +++ b/examples/advanced/ex03_tensor_board.py @@ -32,11 +32,19 @@ data_handler = mala.DataHandler(parameters) data_handler.add_snapshot( - "Be_snapshot0.in.npy", data_path, "Be_snapshot0.out.npy", data_path, "tr", + "Be_snapshot0.in.npy", + data_path, + "Be_snapshot0.out.npy", + data_path, + "tr", calculation_output_file=os.path.join(data_path, "Be_snapshot0.out"), ) data_handler.add_snapshot( - "Be_snapshot1.in.npy", data_path, "Be_snapshot1.out.npy", data_path, "va", + "Be_snapshot1.in.npy", + data_path, + "Be_snapshot1.out.npy", + data_path, + "va", calculation_output_file=os.path.join(data_path, "Be_snapshot1.out"), ) data_handler.prepare_data() diff --git a/mala/datahandling/fast_tensor_dataset.py b/mala/datahandling/fast_tensor_dataset.py index 0f650b56a..50f2679a0 100644 --- a/mala/datahandling/fast_tensor_dataset.py +++ b/mala/datahandling/fast_tensor_dataset.py @@ -26,7 +26,6 
@@ class FastTensorDataset(torch.utils.data.Dataset): """ def __init__(self, batch_size, *tensors): - """ """ super(FastTensorDataset).__init__() self.batch_size = batch_size self._tensors = tensors diff --git a/mala/network/hyperparameter.py b/mala/network/hyperparameter.py index b951c85a5..4294d6a4f 100644 --- a/mala/network/hyperparameter.py +++ b/mala/network/hyperparameter.py @@ -44,10 +44,33 @@ class Hyperparameter(JSONSerializable): choices : list List of possible choices (for categorical parameter). - Returns - ------- - hyperparameter : HyperparameterOptuna or HyperparameterOAT or HyperparameterNASWOT or HyperparameterACSD - Hyperparameter in desired format. + Attributes + ---------- + opttype : string + Datatype of the hyperparameter. Follows optunas naming convetions. + In principle supported are: + + - float + - int + - categorical (list) + + Float and int are not available for OA based approaches at the + moment. + + name : string + Name of the hyperparameter. Please note that these names always + have to be distinct; if you e.g. want to investigate multiple + layer sizes use e.g. ff_neurons_layer_001, ff_neurons_layer_002, + etc. as names. + + low : float or int + Lower bound for numerical parameter. + + high : float or int + Higher bound for numerical parameter. + + choices : list + List of possible choices (for categorical parameter). """ def __new__( diff --git a/mala/network/network.py b/mala/network/network.py index 3835702b9..6a9a5dbe1 100644 --- a/mala/network/network.py +++ b/mala/network/network.py @@ -8,7 +8,7 @@ import torch.nn.functional as functional from mala.common.parameters import Parameters -from mala.common.parallelizer import printout +from mala.common.parallelizer import printout, parallel_warn class Network(nn.Module): @@ -23,6 +23,23 @@ class Network(nn.Module): ---------- params : mala.common.parametes.Parameters Parameters used to create this neural network. + + Attributes + ---------- + loss_func : function + Loss function. + + mini_batch_size : int + Size of mini batches propagated through network. + + number_of_layers : int + Number of NN layers. + + params : mala.common.parametes.ParametersNetwork + MALA neural network parameters. + + use_ddp : bool + If True, the torch distributed data parallel formalism will be used. """ def __new__(cls, params: Parameters): @@ -78,7 +95,7 @@ def __init__(self, params: Parameters): super(Network, self).__init__() # Mappings for parsing of the activation layers. - self.activation_mappings = { + self._activation_mappings = { "Sigmoid": nn.Sigmoid, "ReLU": nn.ReLU, "LeakyReLU": nn.LeakyReLU, @@ -96,12 +113,19 @@ def __init__(self, params: Parameters): @abstractmethod def forward(self, inputs): - """Abstract method. To be implemented by the derived class.""" + """ + Abstract method. To be implemented by the derived class. + + Parameters + ---------- + inputs : torch.Tensor + Torch tensor to be propagated. + """ pass def do_prediction(self, array): """ - Predict the output values for an input array.. + Predict the output values for an input array. Interface to do predictions. The data put in here is assumed to be a scaled torch.Tensor and in the right units. Be aware that this will @@ -143,8 +167,6 @@ def calculate_loss(self, output, target): """ return self.loss_func(output, target) - # FIXME: This guarentees downwards compatibility, but it is ugly. - # Rather enforce the right package versions in the repo. def save_network(self, path_to_file): """ Save the network. 
@@ -238,13 +260,13 @@ def __init__(self, params): try: if use_only_one_activation_type: self.layers.append( - self.activation_mappings[ + self._activation_mappings[ self.params.layer_activations[0] ]() ) else: self.layers.append( - self.activation_mappings[ + self._activation_mappings[ self.params.layer_activations[i] ]() ) @@ -281,6 +303,11 @@ class LSTM(Network): # was passed to be used in the entire network. def __init__(self, params): super(LSTM, self).__init__(params) + parallel_warn( + "The LSTM class will be deprecated in MALA v1.4.0.", + 0, + category=FutureWarning, + ) self.hidden_dim = self.params.layer_sizes[-1] @@ -312,7 +339,7 @@ def __init__(self, params): self.params.num_hidden_layers, batch_first=True, ) - self.activation = self.activation_mappings[ + self.activation = self._activation_mappings[ self.params.layer_activations[0] ]() @@ -417,6 +444,11 @@ class GRU(LSTM): # layer as GRU. def __init__(self, params): Network.__init__(self, params) + parallel_warn( + "The GRU class will be deprecated in MALA v1.4.0.", + 0, + category=FutureWarning, + ) self.hidden_dim = self.params.layer_sizes[-1] @@ -445,7 +477,7 @@ def __init__(self, params): self.params.num_hidden_layers, batch_first=True, ) - self.activation = self.activation_mappings[ + self.activation = self._activation_mappings[ self.params.layer_activations[0] ]() @@ -536,6 +568,11 @@ class TransformerNet(Network): def __init__(self, params): super(TransformerNet, self).__init__(params) + parallel_warn( + "The TransformerNet class will be deprecated in MALA v1.4.0.", + 0, + category=FutureWarning, + ) # Adjust number of heads. if self.params.layer_sizes[0] % self.params.num_heads != 0: @@ -637,6 +674,11 @@ class PositionalEncoding(nn.Module): """ def __init__(self, d_model, dropout=0.1, max_len=400): + parallel_warn( + "The PositionalEncoding class will be deprecated in MALA v1.4.0.", + 0, + category=FutureWarning, + ) super(PositionalEncoding, self).__init__() self.dropout = nn.Dropout(p=dropout) diff --git a/mala/network/objective_base.py b/mala/network/objective_base.py index c90916935..539820f8e 100644 --- a/mala/network/objective_base.py +++ b/mala/network/objective_base.py @@ -16,22 +16,19 @@ class ObjectiveBase: Represents the objective function of a training process. This is usually the result of a training of a network. - """ - def __init__(self, params, data_handler): - """ - Create an ObjectiveBase object. + Parameters + ---------- + params : mala.common.parametes.Parameters + Parameters used to create this objective. - Parameters - ---------- - params : mala.common.parametes.Parameters - Parameters used to create this objective. + data_handler : mala.datahandling.data_handler.DataHandler + datahandler to be used during the hyperparameter optimization. + """ - data_handler : mala.datahandling.data_handler.DataHandler - datahandler to be used during the hyperparameter optimization. - """ + def __init__(self, params, data_handler): self.params: Parameters = params - self.data_handler = data_handler + self._data_handler = data_handler # We need to find out if we have to reparametrize the lists with the # layers and the activations. @@ -59,17 +56,17 @@ def __init__(self, params, data_handler): "the range of neurons or number of layers is missing. " "This input will be ignored." 
) - self.optimize_layer_list = contains_single_layer or ( + self._optimize_layer_list = contains_single_layer or ( contains_multiple_layer_neurons and contains_multiple_layers_count ) - self.optimize_activation_list = list( + self._optimize_activation_list = list( map( lambda p: "layer_activation" in p.name, self.params.hyperparameters.hlist, ) ).count(True) - self.trial_type = self.params.hyperparameters.hyper_opt_method + self._trial_type = self.params.hyperparameters.hyper_opt_method def __call__(self, trial): """ @@ -84,7 +81,7 @@ def __call__(self, trial): # Parse the parameters included in the trial. self.parse_trial(trial) if ( - self.trial_type == "optuna" + self._trial_type == "optuna" and self.params.hyperparameters.pruner == "naswot" ): if trial.should_prune(): @@ -97,12 +94,12 @@ def __call__(self, trial): ): test_network = Network(self.params) test_trainer = Trainer( - self.params, test_network, self.data_handler + self.params, test_network, self._data_handler ) test_trainer.train_network() final_validation_loss.append(test_trainer.final_validation_loss) if ( - self.trial_type == "optuna" + self._trial_type == "optuna" and self.params.hyperparameters.pruner == "multi_training" ): @@ -149,9 +146,9 @@ def parse_trial(self, trial): A trial is a set of hyperparameters; can be an optuna based trial or simply a OAT compatible list. """ - if self.trial_type == "optuna": + if self._trial_type == "optuna": self.parse_trial_optuna(trial) - elif self.trial_type == "oat": + elif self._trial_type == "oat": self.parse_trial_oat(trial) else: raise Exception( @@ -168,11 +165,11 @@ def parse_trial_optuna(self, trial: Trial): trial : optuna.trial.Trial. A set of hyperparameters encoded by optuna. """ - if self.optimize_layer_list: + if self._optimize_layer_list: self.params.network.layer_sizes = [ - self.data_handler.input_dimension + self._data_handler.input_dimension ] - if self.optimize_activation_list > 0: + if self._optimize_activation_list > 0: self.params.network.layer_activations = [] # Some layers may have been turned off by optuna. @@ -275,9 +272,9 @@ def parse_trial_optuna(self, trial: Trial): ) layer_counter += 1 - if self.optimize_layer_list: + if self._optimize_layer_list: self.params.network.layer_sizes.append( - self.data_handler.output_dimension + self._data_handler.output_dimension ) def parse_trial_oat(self, trial): @@ -289,12 +286,12 @@ def parse_trial_oat(self, trial): trial : numpy.array Row in an orthogonal array which respresents current trial. """ - if self.optimize_layer_list: + if self._optimize_layer_list: self.params.network.layer_sizes = [ - self.data_handler.input_dimension + self._data_handler.input_dimension ] - if self.optimize_activation_list: + if self._optimize_activation_list: self.params.network.layer_activations = [] # Some layers may have been turned off by optuna. @@ -405,7 +402,7 @@ def parse_trial_oat(self, trial): ) layer_counter += 1 - if self.optimize_layer_list: + if self._optimize_layer_list: self.params.network.layer_sizes.append( - self.data_handler.output_dimension + self._data_handler.output_dimension ) diff --git a/mala/network/objective_naswot.py b/mala/network/objective_naswot.py index 96377e527..56108211d 100644 --- a/mala/network/objective_naswot.py +++ b/mala/network/objective_naswot.py @@ -75,14 +75,14 @@ def __call__(self, trial): # Load the batchesand get the jacobian. 
do_shuffle = self.params.running.use_shuffling_for_samplers if ( - self.data_handler.parameters.use_lazy_loading + self._data_handler.parameters.use_lazy_loading or self.params.use_ddp ): do_shuffle = False if self.params.running.use_shuffling_for_samplers: - self.data_handler.mix_datasets() + self._data_handler.mix_datasets() loader = DataLoader( - self.data_handler.training_data_sets[0], + self._data_handler.training_data_sets[0], batch_size=self.batch_size, shuffle=do_shuffle, ) diff --git a/mala/network/predictor.py b/mala/network/predictor.py index 440929906..3dfc99177 100644 --- a/mala/network/predictor.py +++ b/mala/network/predictor.py @@ -26,6 +26,12 @@ class Predictor(Runner): data : mala.datahandling.data_handler.DataHandler DataHandler, in this case not directly holding data, but serving as an interface to Target and Descriptor objects. + + Attributes + ---------- + target_calculator : mala.targets.target.Target + Target calculator used for predictions. Can be used for further + processing. """ def __init__(self, params, network, data): @@ -37,8 +43,8 @@ def __init__(self, params, network, data): * self.data.grid_dimension[1] * self.data.grid_dimension[2] ) - self.test_data_loader = None - self.number_of_batches_per_snapshot = 0 + self._test_data_loader = None + self._number_of_batches_per_snapshot = 0 self.target_calculator = data.target_calculator def predict_from_qeout(self, path_to_file, gather_ldos=False): @@ -228,11 +234,11 @@ def _forward_snap_descriptors( ) self.parameters.mini_batch_size = optimal_batch_size - self.number_of_batches_per_snapshot = int( + self._number_of_batches_per_snapshot = int( local_data_size / self.parameters.mini_batch_size ) - for i in range(0, self.number_of_batches_per_snapshot): + for i in range(0, self._number_of_batches_per_snapshot): sl = slice( i * self.parameters.mini_batch_size, (i + 1) * self.parameters.mini_batch_size, diff --git a/mala/network/runner.py b/mala/network/runner.py index 9daf32f6a..c4bfa6f0d 100644 --- a/mala/network/runner.py +++ b/mala/network/runner.py @@ -38,6 +38,20 @@ class Runner: network : mala.network.network.Network Network which is being run. + data : mala.datahandling.data_handler.DataHandler + DataHandler holding the data for the run. + + Attributes + ---------- + parameters : mala.common.parametes.ParametersRunning + MALA neural network training/inference parameters. + + parameters_full : mala.common.parametes.Parameters + Full MALA Parameters object. + + network : mala.network.network.Network + Network which is being run. + data : mala.datahandling.data_handler.DataHandler DataHandler holding the data for the run. """ diff --git a/mala/network/tester.py b/mala/network/tester.py index fa1a27190..d7c07761a 100644 --- a/mala/network/tester.py +++ b/mala/network/tester.py @@ -41,6 +41,32 @@ class Tester(Runner): - "density": MAPE of the density prediction - "dos": MAPE of the DOS prediction + output_format : string + Can be "list" or "mae". If "list", then a list of results across all + snapshots is returned. If "mae", then the MAE across all snapshots + will be calculated and returned. + + Attributes + ---------- + target_calculator : mala.targets.target.Target + Target calculator used for predictions. Can be used for further + processing. + + observables_to_test : list + List of observables to test. Supported are: + + - "ldos": Calculate the MSE loss of the LDOS. 
+        - "band_energy": Band energy error
+        - "band_energy_full": Band energy absolute values (only works with
+          list, as both actual and predicted are returned)
+        - "total_energy": Total energy error
+        - "total_energy_full": Total energy absolute values (only works
+          with list, as both actual and predicted are returned)
+        - "number_of_electrons": Number of electrons (Fermi energy is not
+          determined dynamically for this quantity).
+        - "density": MAPE of the density prediction
+        - "dos": MAPE of the DOS prediction
+
     output_format : string
         Can be "list" or "mae". If "list", then a list of results across all
         snapshots is returned. If "mae", then the MAE across all snapshots
@@ -57,8 +83,8 @@ def __init__(
     ):
         # copy the parameters into the class.
         super(Tester, self).__init__(params, network, data)
-        self.test_data_loader = None
-        self.number_of_batches_per_snapshot = 0
+        self._test_data_loader = None
+        self._number_of_batches_per_snapshot = 0
         self.observables_to_test = observables_to_test
         self.output_format = output_format
         if self.output_format != "list" and self.output_format != "mae":
@@ -205,7 +231,7 @@ def predict_targets(self, snapshot_number, data_type="te"):
             offset_snapshots + snapshot_number,
             data_set,
             data_type,
-            self.number_of_batches_per_snapshot,
+            self._number_of_batches_per_snapshot,
             self.parameters.mini_batch_size,
         )
 
@@ -235,6 +261,6 @@ def __prepare_to_test(self, snapshot_number):
                 min_verbosity=0,
             )
         self.parameters.mini_batch_size = optimal_batch_size
-        self.number_of_batches_per_snapshot = int(
+        self._number_of_batches_per_snapshot = int(
             grid_size / self.parameters.mini_batch_size
         )
diff --git a/mala/network/trainer.py b/mala/network/trainer.py
index 85fc52044..3a12f994a 100644
--- a/mala/network/trainer.py
+++ b/mala/network/trainer.py
@@ -38,11 +38,23 @@ class Trainer(Runner):
     data : mala.datahandling.data_handler.DataHandler
         DataHandler holding the training data.
 
-    use_pkl_checkpoints : bool
-        If true, .pkl checkpoints will be created.
+    _optimizer_dict : dict
+        For internal use by the Trainer class during loading procedures only.
+
+    Attributes
+    ----------
+
+    final_validation_loss : float
+        Validation loss after training
+
+    network : mala.network.network.Network
+        Network which is being trained.
+
+    full_logging_path : str
+        Full path to training logs.
     """
 
-    def __init__(self, params, network, data, optimizer_dict=None):
+    def __init__(self, params, network, data, _optimizer_dict=None):
         # copy the parameters into the class.
         super(Trainer, self).__init__(params, network, data)
 
@@ -56,22 +68,21 @@ def __init__(self, params, network, data, optimizer_dict=None):
             torch.cuda.current_stream().wait_stream(s)
 
         self.final_validation_loss = float("inf")
-        self.initial_validation_loss = float("inf")
-        self.optimizer = None
-        self.scheduler = None
-        self.patience_counter = 0
-        self.last_epoch = 0
-        self.last_loss = None
-        self.training_data_loaders = []
-        self.validation_data_loaders = []
+        self._optimizer = None
+        self._scheduler = None
+        self._patience_counter = 0
+        self._last_epoch = 0
+        self._last_loss = None
+        self._training_data_loaders = []
+        self._validation_data_loaders = []
 
         # Samplers for the ddp case.
- self.train_sampler = None - self.validation_sampler = None + self._train_sampler = None + self._validation_sampler = None - self.__prepare_to_train(optimizer_dict) + self.__prepare_to_train(_optimizer_dict) - self.logger = None + self._logger = None self.full_logging_path = None if self.parameters.logger is not None: os.makedirs(self.parameters.logging_dir, exist_ok=True) @@ -92,9 +103,9 @@ def __init__(self, params, network, data, optimizer_dict=None): if self.parameters.logger == "wandb": import wandb - self.logger = wandb + self._logger = wandb elif self.parameters.logger == "tensorboard": - self.logger = SummaryWriter(self.full_logging_path) + self._logger = SummaryWriter(self.full_logging_path) else: raise Exception( f"Unsupported logger {self.parameters.logger}." @@ -105,13 +116,13 @@ def __init__(self, params, network, data, optimizer_dict=None): min_verbosity=1, ) - self.gradscaler = None + self._gradscaler = None if self.parameters.use_mixed_precision: printout("Using mixed precision via AMP.", min_verbosity=1) - self.gradscaler = torch.cuda.amp.GradScaler() + self._gradscaler = torch.cuda.amp.GradScaler() - self.train_graph = None - self.validation_graph = None + self._train_graph = None + self._validation_graph = None @classmethod def run_exists(cls, run_name, params_format="json", zip_run=True): @@ -253,7 +264,7 @@ def _load_from_run(cls, params, network, data, file=None): # Now, create the Trainer class with it. loaded_trainer = Trainer( - params, network, data, optimizer_dict=checkpoint + params, network, data, _optimizer_dict=checkpoint ) return loaded_trainer @@ -265,18 +276,15 @@ def train_network(self): vloss = float("inf") - # Save losses for later use. - self.initial_validation_loss = vloss - # Initialize all the counters. checkpoint_counter = 0 # If we restarted from a checkpoint, we have to differently initialize # the loss. - if self.last_loss is None: + if self._last_loss is None: vloss_old = vloss else: - vloss_old = self.last_loss + vloss_old = self._last_loss ############################ # PERFORM TRAINING @@ -284,7 +292,9 @@ def train_network(self): total_batch_id = 0 - for epoch in range(self.last_epoch, self.parameters.max_number_epochs): + for epoch in range( + self._last_epoch, self.parameters.max_number_epochs + ): start_time = time.time() # Prepare model for training. 
@@ -298,8 +308,8 @@ def train_network(self): ) # train sampler - if self.train_sampler: - self.train_sampler.set_epoch(epoch) + if self._train_sampler: + self._train_sampler.set_epoch(epoch) # shuffle dataset if necessary if isinstance(self.data.training_data_sets[0], FastTensorDataset): @@ -312,7 +322,7 @@ def train_network(self): tsample = time.time() t0 = time.time() batchid = 0 - for loader in self.training_data_loaders: + for loader in self._training_data_loaders: t = time.time() for inputs, outputs in tqdm( loader, @@ -387,19 +397,19 @@ def train_network(self): training_loss_sum_logging / self.parameters.training_log_interval ) - self.logger.add_scalars( + self._logger.add_scalars( "ldos", {"during_training": training_loss_mean}, total_batch_id, ) - self.logger.close() + self._logger.close() training_loss_sum_logging = 0.0 if self.parameters.logger == "wandb": training_loss_mean = ( training_loss_sum_logging / self.parameters.training_log_interval ) - self.logger.log( + self._logger.log( { "ldos_during_training": training_loss_mean }, @@ -422,7 +432,7 @@ def train_network(self): ) else: batchid = 0 - for loader in self.training_data_loaders: + for loader in self._training_data_loaders: for inputs, outputs in loader: inputs = inputs.to( self.parameters._configuration["device"] @@ -473,7 +483,7 @@ def train_network(self): if self.parameters.logger == "tensorboard": for dataset_fraction in dataset_fractions: for metric in errors[dataset_fraction]: - self.logger.add_scalars( + self._logger.add_scalars( metric, { dataset_fraction: errors[dataset_fraction][ @@ -482,11 +492,11 @@ def train_network(self): }, total_batch_id, ) - self.logger.close() + self._logger.close() if self.parameters.logger == "wandb": for dataset_fraction in dataset_fractions: for metric in errors[dataset_fraction]: - self.logger.log( + self._logger.log( { f"{dataset_fraction}_{metric}": errors[ dataset_fraction @@ -510,38 +520,38 @@ def train_network(self): ) # If a scheduler is used, update it. - if self.scheduler is not None: + if self._scheduler is not None: if ( self.parameters.learning_rate_scheduler == "ReduceLROnPlateau" ): - self.scheduler.step(vloss) + self._scheduler.step(vloss) # If early stopping is used, check if we need to do something. if self.parameters.early_stopping_epochs > 0: if vloss < vloss_old * ( 1.0 - self.parameters.early_stopping_threshold ): - self.patience_counter = 0 + self._patience_counter = 0 vloss_old = vloss else: - self.patience_counter += 1 + self._patience_counter += 1 printout( "Validation accuracy has not improved enough.", min_verbosity=1, ) if ( - self.patience_counter + self._patience_counter >= self.parameters.early_stopping_epochs ): printout( "Stopping the training, validation " "accuracy has not improved for", - self.patience_counter, + self._patience_counter, "epochs.", min_verbosity=1, ) - self.last_epoch = epoch + self._last_epoch = epoch break # If checkpointing is enabled, we need to checkpoint. @@ -552,8 +562,8 @@ def train_network(self): >= self.parameters.checkpoints_each_epoch ): printout("Checkpointing training.", min_verbosity=0) - self.last_epoch = epoch - self.last_loss = vloss_old + self._last_epoch = epoch + self._last_loss = vloss_old self.__create_training_checkpoint() checkpoint_counter = 0 @@ -590,8 +600,8 @@ def train_network(self): # Clean-up for pre-fetching lazy loading. 
if self.data.parameters.use_lazy_loading_prefetch: - self.training_data_loaders.cleanup() - self.validation_data_loaders.cleanup() + self._training_data_loaders.cleanup() + self._validation_data_loaders.cleanup() def _validate_network(self, data_set_fractions, metrics): # """Validate a network, using train or validation data.""" @@ -599,13 +609,13 @@ def _validate_network(self, data_set_fractions, metrics): errors = {} for data_set_type in data_set_fractions: if data_set_type == "train": - data_loaders = self.training_data_loaders + data_loaders = self._training_data_loaders data_sets = self.data.training_data_sets number_of_snapshots = self.data.nr_training_snapshots offset_snapshots = 0 elif data_set_type == "validation": - data_loaders = self.validation_data_loaders + data_loaders = self._validation_data_loaders data_sets = self.data.validation_data_sets number_of_snapshots = self.data.nr_validation_snapshots offset_snapshots = self.data.nr_training_snapshots @@ -720,11 +730,11 @@ def __prepare_to_train(self, optimizer_dict): # Read last epoch if optimizer_dict is not None: - self.last_epoch = optimizer_dict["epoch"] + 1 + self._last_epoch = optimizer_dict["epoch"] + 1 # Scale the learning rate according to ddp. if self.parameters_full.use_ddp: - if dist.get_world_size() > 1 and self.last_epoch == 0: + if dist.get_world_size() > 1 and self._last_epoch == 0: printout( "Rescaling learning rate because multiple workers are" " used for training.", @@ -736,20 +746,20 @@ def __prepare_to_train(self, optimizer_dict): # Choose an optimizer to use. if self.parameters.optimizer == "SGD": - self.optimizer = optim.SGD( + self._optimizer = optim.SGD( self.network.parameters(), lr=self.parameters.learning_rate, weight_decay=self.parameters.l2_regularization, ) elif self.parameters.optimizer == "Adam": - self.optimizer = optim.Adam( + self._optimizer = optim.Adam( self.network.parameters(), lr=self.parameters.learning_rate, weight_decay=self.parameters.l2_regularization, ) elif self.parameters.optimizer == "FusedAdam": if version.parse(torch.__version__) >= version.parse("1.13.0"): - self.optimizer = optim.Adam( + self._optimizer = optim.Adam( self.network.parameters(), lr=self.parameters.learning_rate, weight_decay=self.parameters.l2_regularization, @@ -762,11 +772,11 @@ def __prepare_to_train(self, optimizer_dict): # Load data from pytorch file. if optimizer_dict is not None: - self.optimizer.load_state_dict( + self._optimizer.load_state_dict( optimizer_dict["optimizer_state_dict"] ) - self.patience_counter = optimizer_dict["early_stopping_counter"] - self.last_loss = optimizer_dict["early_stopping_last_loss"] + self._patience_counter = optimizer_dict["early_stopping_counter"] + self._last_loss = optimizer_dict["early_stopping_last_loss"] if self.parameters_full.use_ddp: # scaling the batch size for multiGPU per node @@ -781,7 +791,7 @@ def __prepare_to_train(self, optimizer_dict): if self.data.parameters.use_lazy_loading: do_shuffle = False - self.train_sampler = ( + self._train_sampler = ( torch.utils.data.distributed.DistributedSampler( self.data.training_data_sets[0], num_replicas=dist.get_world_size(), @@ -789,7 +799,7 @@ def __prepare_to_train(self, optimizer_dict): shuffle=do_shuffle, ) ) - self.validation_sampler = ( + self._validation_sampler = ( torch.utils.data.distributed.DistributedSampler( self.data.validation_data_sets[0], num_replicas=dist.get_world_size(), @@ -800,8 +810,8 @@ def __prepare_to_train(self, optimizer_dict): # Instantiate the learning rate scheduler, if necessary. 
if self.parameters.learning_rate_scheduler == "ReduceLROnPlateau": - self.scheduler = optim.lr_scheduler.ReduceLROnPlateau( - self.optimizer, + self._scheduler = optim.lr_scheduler.ReduceLROnPlateau( + self._optimizer, patience=self.parameters.learning_rate_patience, mode="min", factor=self.parameters.learning_rate_decay, @@ -811,8 +821,8 @@ def __prepare_to_train(self, optimizer_dict): pass else: raise Exception("Unsupported learning rate schedule.") - if self.scheduler is not None and optimizer_dict is not None: - self.scheduler.load_state_dict( + if self._scheduler is not None and optimizer_dict is not None: + self._scheduler.load_state_dict( optimizer_dict["lr_scheduler_state_dict"] ) @@ -848,11 +858,11 @@ def __prepare_to_train(self, optimizer_dict): if isinstance(self.data.training_data_sets[0], FastTensorDataset): # Not shuffling in loader. # I manually shuffle the data set each epoch. - self.training_data_loaders.append( + self._training_data_loaders.append( DataLoader( self.data.training_data_sets[0], batch_size=None, - sampler=self.train_sampler, + sampler=self._train_sampler, **kwargs, shuffle=False, ) @@ -861,26 +871,26 @@ def __prepare_to_train(self, optimizer_dict): if isinstance( self.data.training_data_sets[0], LazyLoadDatasetSingle ): - self.training_data_loaders = MultiLazyLoadDataLoader( + self._training_data_loaders = MultiLazyLoadDataLoader( self.data.training_data_sets, **kwargs ) else: - self.training_data_loaders.append( + self._training_data_loaders.append( DataLoader( self.data.training_data_sets[0], batch_size=self.parameters.mini_batch_size, - sampler=self.train_sampler, + sampler=self._train_sampler, **kwargs, shuffle=do_shuffle, ) ) if isinstance(self.data.validation_data_sets[0], FastTensorDataset): - self.validation_data_loaders.append( + self._validation_data_loaders.append( DataLoader( self.data.validation_data_sets[0], batch_size=None, - sampler=self.validation_sampler, + sampler=self._validation_sampler, **kwargs, ) ) @@ -888,15 +898,15 @@ def __prepare_to_train(self, optimizer_dict): if isinstance( self.data.validation_data_sets[0], LazyLoadDatasetSingle ): - self.validation_data_loaders = MultiLazyLoadDataLoader( + self._validation_data_loaders = MultiLazyLoadDataLoader( self.data.validation_data_sets, **kwargs ) else: - self.validation_data_loaders.append( + self._validation_data_loaders.append( DataLoader( self.data.validation_data_sets[0], batch_size=self.parameters.mini_batch_size * 1, - sampler=self.validation_sampler, + sampler=self._validation_sampler, **kwargs, ) ) @@ -904,7 +914,7 @@ def __prepare_to_train(self, optimizer_dict): def __process_mini_batch(self, network, input_data, target_data): """Process a mini batch.""" if self.parameters._configuration["gpu"]: - if self.parameters.use_graphs and self.train_graph is None: + if self.parameters.use_graphs and self._train_graph is None: printout("Capturing CUDA graph for training.", min_verbosity=2) s = torch.cuda.Stream(self.parameters._configuration["device"]) s.wait_stream( @@ -931,8 +941,8 @@ def __process_mini_batch(self, network, input_data, target_data): prediction, target_data ) - if self.gradscaler: - self.gradscaler.scale(loss).backward() + if self._gradscaler: + self._gradscaler.scale(loss).backward() else: loss.backward() torch.cuda.current_stream( @@ -940,38 +950,40 @@ def __process_mini_batch(self, network, input_data, target_data): ).wait_stream(s) # Create static entry point tensors to graph - self.static_input_data = torch.empty_like(input_data) - self.static_target_data = 
torch.empty_like(target_data) + self._static_input_data = torch.empty_like(input_data) + self._static_target_data = torch.empty_like(target_data) # Capture graph - self.train_graph = torch.cuda.CUDAGraph() + self._train_graph = torch.cuda.CUDAGraph() network.zero_grad(set_to_none=True) - with torch.cuda.graph(self.train_graph): + with torch.cuda.graph(self._train_graph): with torch.cuda.amp.autocast( enabled=self.parameters.use_mixed_precision ): - self.static_prediction = network( - self.static_input_data + self._static_prediction = network( + self._static_input_data ) if self.parameters_full.use_ddp: - self.static_loss = network.module.calculate_loss( - self.static_prediction, self.static_target_data + self._static_loss = network.module.calculate_loss( + self._static_prediction, + self._static_target_data, ) else: - self.static_loss = network.calculate_loss( - self.static_prediction, self.static_target_data + self._static_loss = network.calculate_loss( + self._static_prediction, + self._static_target_data, ) - if self.gradscaler: - self.gradscaler.scale(self.static_loss).backward() + if self._gradscaler: + self._gradscaler.scale(self._static_loss).backward() else: - self.static_loss.backward() + self._static_loss.backward() - if self.train_graph: - self.static_input_data.copy_(input_data) - self.static_target_data.copy_(target_data) - self.train_graph.replay() + if self._train_graph: + self._static_input_data.copy_(input_data) + self._static_target_data.copy_(target_data) + self._train_graph.replay() else: torch.cuda.nvtx.range_push("zero_grad") self.network.zero_grad(set_to_none=True) @@ -1001,24 +1013,24 @@ def __process_mini_batch(self, network, input_data, target_data): # loss torch.cuda.nvtx.range_pop() - if self.gradscaler: - self.gradscaler.scale(loss).backward() + if self._gradscaler: + self._gradscaler.scale(loss).backward() else: loss.backward() t = time.time() torch.cuda.nvtx.range_push("optimizer") - if self.gradscaler: - self.gradscaler.step(self.optimizer) - self.gradscaler.update() + if self._gradscaler: + self._gradscaler.step(self._optimizer) + self._gradscaler.update() else: - self.optimizer.step() + self._optimizer.step() dt = time.time() - t printout(f"optimizer time: {dt}", min_verbosity=3) torch.cuda.nvtx.range_pop() # optimizer - if self.train_graph: - return self.static_loss + if self._train_graph: + return self._static_loss else: return loss else: @@ -1028,8 +1040,8 @@ def __process_mini_batch(self, network, input_data, target_data): else: loss = network.calculate_loss(prediction, target_data) loss.backward() - self.optimizer.step() - self.optimizer.zero_grad() + self._optimizer.step() + self._optimizer.zero_grad() return loss def __create_training_checkpoint(self): @@ -1046,20 +1058,20 @@ def __create_training_checkpoint(self): if self.parameters_full.use_ddp: if dist.get_rank() != 0: return - if self.scheduler is None: + if self._scheduler is None: save_dict = { - "epoch": self.last_epoch, - "optimizer_state_dict": self.optimizer.state_dict(), - "early_stopping_counter": self.patience_counter, - "early_stopping_last_loss": self.last_loss, + "epoch": self._last_epoch, + "optimizer_state_dict": self._optimizer.state_dict(), + "early_stopping_counter": self._patience_counter, + "early_stopping_last_loss": self._last_loss, } else: save_dict = { - "epoch": self.last_epoch, - "optimizer_state_dict": self.optimizer.state_dict(), - "lr_scheduler_state_dict": self.scheduler.state_dict(), - "early_stopping_counter": self.patience_counter, - "early_stopping_last_loss": 
self.last_loss,
+            "epoch": self._last_epoch,
+            "optimizer_state_dict": self._optimizer.state_dict(),
+            "lr_scheduler_state_dict": self._scheduler.state_dict(),
+            "early_stopping_counter": self._patience_counter,
+            "early_stopping_last_loss": self._last_loss,
             }
         torch.save(
             save_dict, optimizer_name, _use_new_zipfile_serialization=False
diff --git a/test/checkpoint_training_test.py b/test/checkpoint_training_test.py
index 3bc5e83e3..610afbd82 100644
--- a/test/checkpoint_training_test.py
+++ b/test/checkpoint_training_test.py
@@ -73,7 +73,7 @@ def test_early_stopping(self):
             learning_rate=0.1,
         )
         trainer.train_network()
-        original_nr_epochs = trainer.last_epoch
+        original_nr_epochs = trainer._last_epoch
 
         # Now do the same, but cut at epoch 22 and see if it recovers the
         # correct result.
@@ -86,7 +86,7 @@ def test_early_stopping(self):
         trainer.train_network()
         trainer = self.__resume_checkpoint(test_checkpoint_name, 40)
         trainer.train_network()
-        last_nr_epochs = trainer.last_epoch
+        last_nr_epochs = trainer._last_epoch
 
         # integer comparison!
         assert original_nr_epochs == last_nr_epochs
diff --git a/test/inference_test.py b/test/inference_test.py
index 956410cc7..84e0e9cca 100644
--- a/test/inference_test.py
+++ b/test/inference_test.py
@@ -33,7 +33,7 @@ def test_unit_conversion(self):
 
         # Confirm that unit conversion does not introduce any errors.
 
-        from_file_1 = data_handler._target_calculator.convert_units(
+        from_file_1 = data_handler.target_calculator.convert_units(
             np.load(
                 os.path.join(data_path, "Be_snapshot" + str(0) + ".out.npy")
             ),
@@ -41,7 +41,7 @@ def test_unit_conversion(self):
         )
         from_file_2 = np.load(
             os.path.join(data_path, "Be_snapshot" + str(0) + ".out.npy")
-        ) * data_handler._target_calculator.convert_units(
+        ) * data_handler.target_calculator.convert_units(
             1, in_units="1/(eV*Bohr^3)"
         )
 
From f099a7caf277253042133519cf5c4d1c3e71f7ef Mon Sep 17 00:00:00 2001
From: Lenz Fiedler
Date: Mon, 25 Nov 2024 17:42:02 +0100
Subject: [PATCH 14/21] Working on Target class

---
 mala/targets/atomic_force.py |  5 ++++
 mala/targets/density.py      | 22 ++++++++++++--
 mala/targets/dos.py          | 11 +++++++
 mala/targets/ldos.py         | 14 +++++++--
 mala/targets/target.py       | 57 +++++++++++++++++++++++++++++++++++-
 5 files changed, 104 insertions(+), 5 deletions(-)

diff --git a/mala/targets/atomic_force.py b/mala/targets/atomic_force.py
index d5e81e4cd..a830b806c 100644
--- a/mala/targets/atomic_force.py
+++ b/mala/targets/atomic_force.py
@@ -3,6 +3,7 @@
 from ase.units import Rydberg, Bohr
 
 from .target import Target
+from mala.common.parallelizer import parallel_warn
 
 
 class AtomicForce(Target):
@@ -24,6 +25,10 @@ def __init__(self, params):
             Parameters used to create this TargetBase object.
 
         """
+        parallel_warn(
+            "The AtomicForce class is currently being developed and"
+            " not feature-complete."
+        )
         super(AtomicForce, self).__init__(params)
 
     def get_feature_size(self):
diff --git a/mala/targets/density.py b/mala/targets/density.py
index 26d183cdf..f4b465dc0 100644
--- a/mala/targets/density.py
+++ b/mala/targets/density.py
@@ -29,12 +29,23 @@
 
 
 class Density(Target):
-    """Postprocessing / parsing functions for the electronic density.
+    """
+    Postprocessing / parsing functions for the electronic density.
 
     Parameters
     ----------
     params : mala.common.parameters.Parameters
         Parameters used to create this Target object.
+
+    Attributes
+    ----------
+    density : numpy.ndarray
+        Electronic charge density as a volumetric array. May be 4D or 2D
+        depending on workflow.
+ + te_mutex : bool + Total energy module mutual exclusion token used to make sure there + the total energy module is not initialized twice. """ ############################## @@ -278,6 +289,12 @@ def get_target(self): This is the generic interface for cached target quantities. It should work for all implemented targets. + + Returns + ------- + density : numpy.ndarray + Electronic charge density as a volumetric array. May be 4D or 2D + depending on workflow. """ return self.density @@ -407,7 +424,8 @@ def read_from_cube(self, path, units="1/Bohr^3", **kwargs): Units the density is saved in. Usually none. """ printout("Reading density from .cube file ", path, min_verbosity=0) - # automatically convert units if they are None since cube files take atomic units + # automatically convert units if they are None since cube files take + # atomic units if units is None: units = "1/Bohr^3" if units != "1/Bohr^3": diff --git a/mala/targets/dos.py b/mala/targets/dos.py index faac8dfa4..2ce7bcb76 100644 --- a/mala/targets/dos.py +++ b/mala/targets/dos.py @@ -28,6 +28,11 @@ class DOS(Target): ---------- params : mala.common.parameters.Parameters Parameters used to create this TargetBase object. + + Attributes + ---------- + density_of_states : numpy.ndarray + Electronic density of states. """ ############################## @@ -248,6 +253,12 @@ def get_target(self): This is the generic interface for cached target quantities. It should work for all implemented targets. + + Returns + ------- + density_of_states : numpy.ndarray + Electronic density of states. + """ return self.density_of_states diff --git a/mala/targets/ldos.py b/mala/targets/ldos.py index 4b2f4bbae..363af7f11 100644 --- a/mala/targets/ldos.py +++ b/mala/targets/ldos.py @@ -34,6 +34,13 @@ class LDOS(Target): ---------- params : mala.common.parameters.Parameters Parameters used to create this LDOS object. + + Attributes + ---------- + + local_density_of_states : numpy.ndarray + Electronic local density of states as a volumetric array. + May be 4D- or 2D depending on workflow. """ ############################## @@ -239,6 +246,11 @@ def get_target(self): This is the generic interface for cached target quantities. It should work for all implemented targets. + + Returns + local_density_of_states : numpy.ndarray + Electronic local density of states as a volumetric array. + May be 4D- or 2D depending on workflow. """ return self.local_density_of_states @@ -598,8 +610,6 @@ def get_total_energy( If neither LDOS nor DOS+Density data is provided, the cached LDOS will be attempted to be used for the calculation. - - Parameters ---------- ldos_data : numpy.array diff --git a/mala/targets/target.py b/mala/targets/target.py index 52664353b..6b5e466f5 100644 --- a/mala/targets/target.py +++ b/mala/targets/target.py @@ -34,11 +34,66 @@ class Target(PhysicalData): (i.e. the quantity the NN will learn to predict) from a specified file format and performs postprocessing calculations on the quantity. + Target parsers often read DFT reference information. + Parameters ---------- params : mala.common.parameters.Parameters or mala.common.parameters.ParametersTargets Parameters used to create this Target object. + + Attributes + ---------- + atomic_forces_dft : numpy.ndarray + Atomic forces as per DFT reference file. + + atoms : ase.Atoms + ASE atoms object used for calculations. + + band_energy_dft_calculation + Band energy as per DFT reference file. + + electrons_per_atom : int + Electrons per atom, usually determined by DFT reference file. 
+ + entropy_contribution_dft_calculation : float + Electronic entropy contribution as per DFT reference file. + + fermi_energy_dft : float + Fermi energy as per DFT reference file. + + kpoints : list + k-grid used for MALA calculations. Managed internally. + + local_grid : list + Size of local grid (in MPI mode). + + number_of_electrons_exact + Exact number of electrons, usually given via DFT reference file. + + number_of_electrons_from_eigenvals : float + Number of electrons as calculated from DFT reference eigenvalues. + + parameters : mala.common.parameters.ParametersTarget + MALA target calculation parameters. + + qe_input_data : dict + Quantum ESPRESSO data dictionary, read from DFT reference file and + used for the total energy module. + + qe_pseudopotentials : list + List of Quantum ESPRESSO pseudopotentials, read from DFT reference file + and used for the total energy module. + + save_target_data : bool + Control whether target data will be saved. Can be important for I/O + applications. Managed internally, default is True. + + temperature + total_energy_contributions_dft_calculation + total_energy_dft_calculation + voxel + y_planes """ ############################## @@ -1608,7 +1663,7 @@ def _process_openpmd_attributes(self, series, iteration, mesh): "electrons_per_atom", default_value=self.electrons_per_atom, ) - self.number_of_electrons_from_eigenval = ( + self.number_of_electrons_from_eigenvals = ( self._get_attribute_if_attribute_exists( iteration, "number_of_electrons_from_eigenvals", From 5cb768e8f56e854ff7e705bc76794a82c20dbdf3 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Mon, 25 Nov 2024 19:59:59 +0100 Subject: [PATCH 15/21] Corrected some mistakes --- mala/network/objective_naswot.py | 10 +++++----- test/checkpoint_training_test.py | 4 ++-- 2 files changed, 7 insertions(+), 7 deletions(-) diff --git a/mala/network/objective_naswot.py b/mala/network/objective_naswot.py index 56108211d..7f2c117de 100644 --- a/mala/network/objective_naswot.py +++ b/mala/network/objective_naswot.py @@ -46,10 +46,10 @@ def __init__( batch_size=None, ): super(ObjectiveNASWOT, self).__init__(search_parameters, data_handler) - self.trial_type = trial_type - self.batch_size = batch_size - if self.batch_size is None: - self.batch_size = search_parameters.running.mini_batch_size + self._trial_type = trial_type + self._batch_size = batch_size + if self._batch_size is None: + self._batch_size = search_parameters.running.mini_batch_size def __call__(self, trial): """ @@ -83,7 +83,7 @@ def __call__(self, trial): self._data_handler.mix_datasets() loader = DataLoader( self._data_handler.training_data_sets[0], - batch_size=self.batch_size, + batch_size=self._batch_size, shuffle=do_shuffle, ) jac = ObjectiveNASWOT.__get_batch_jacobian(net, loader, device) diff --git a/test/checkpoint_training_test.py b/test/checkpoint_training_test.py index 610afbd82..46a0b43d0 100644 --- a/test/checkpoint_training_test.py +++ b/test/checkpoint_training_test.py @@ -45,7 +45,7 @@ def test_learning_rate(self): learning_rate=0.1, ) trainer.train_network() - original_learning_rate = trainer.optimizer.param_groups[0]["lr"] + original_learning_rate = trainer._optimizer.param_groups[0]["lr"] # Now do the same, but cut at epoch 22 and see if it recovers the # correct result. 
@@ -58,7 +58,7 @@ def test_learning_rate(self): trainer.train_network() trainer = self.__resume_checkpoint(test_checkpoint_name, 40) trainer.train_network() - new_learning_rate = trainer.optimizer.param_groups[0]["lr"] + new_learning_rate = trainer._optimizer.param_groups[0]["lr"] assert np.isclose( original_learning_rate, new_learning_rate, atol=accuracy ) From 949cea0d026625cdf8caf7cc61b2eaddb0ac95dc Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Mon, 25 Nov 2024 20:40:10 +0100 Subject: [PATCH 16/21] Done with all classes except for Parameters classes --- mala/targets/density.py | 2 +- mala/targets/target.py | 42 ++++++++++++++++++++++++++++++++--------- 2 files changed, 34 insertions(+), 10 deletions(-) diff --git a/mala/targets/density.py b/mala/targets/density.py index f4b465dc0..f514cf0fa 100644 --- a/mala/targets/density.py +++ b/mala/targets/density.py @@ -600,7 +600,7 @@ def get_number_of_electrons( voxel : ase.cell.Cell Voxel to be used for grid intergation. Needs to reflect the - symmetry of the simulation cell. In Bohr. + symmetry of the simulation cell. integration_method : str Integration method used to integrate density on the grid. diff --git a/mala/targets/target.py b/mala/targets/target.py index 6b5e466f5..ebd32f763 100644 --- a/mala/targets/target.py +++ b/mala/targets/target.py @@ -89,11 +89,30 @@ class Target(PhysicalData): Control whether target data will be saved. Can be important for I/O applications. Managed internally, default is True. - temperature - total_energy_contributions_dft_calculation - total_energy_dft_calculation - voxel - y_planes + temperature : float + Temperature used for all computations. By default read from DFT + reference file, but can freely be changed from the outside. + + total_energy_contributions_dft_calculation : dict + Dictionary holding contributions to total free energy not given + as individual properties, as read from the DFT reference file. + Contains: + + - "one_electron_contribution", :math:`n\,V_\mathrm{xc}` plus band + energy + - "hartree_contribution", :math:`E_\mathrm{H}` + - "xc_contribution", :math:`E_\mathrm{xc}` + - "ewald_contribution", :math:`E_\mathrm{Ewald}` + + total_energy_dft_calculation : float + Total free energy as read from DFT reference file. + voxel : ase.cell.Cell + Voxel to be used for grid intergation. Reflects the + symmetry of the simulation cell. Calculated from DFT reference data. + + y_planes : int + Number of y_planes used for Quantum ESPRESSO parallelization. Handled + internally. """ ############################## @@ -154,7 +173,6 @@ def __getnewargs__(self): Used for pickling. - Returns ------- params : mala.Parameters @@ -847,7 +865,14 @@ def get_energy_grid(self): raise Exception("No method implement to calculate an energy grid.") def get_real_space_grid(self): - """Get the real space grid.""" + """ + Get the real space grid. + + Returns + ------- + grid3D : numpy.ndarray + Numpy array holding the entire grid. + """ grid3D = np.zeros( ( self.grid_dimensions[0], @@ -1429,8 +1454,7 @@ def write_tem_input_file( None. mpi_rank : int - Rank within MPI - + Rank within MPI. """ # Specify grid dimensions, if any are given. 
if ( From b24a9fb364538bf5bea5e4876c5f7e82bd8d489a Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Mon, 25 Nov 2024 21:25:03 +0100 Subject: [PATCH 17/21] Made some non-overlapping changes in the Parameters classes --- mala/common/parameters.py | 73 +++++++++++++++++++++++++++++++++++++-- 1 file changed, 70 insertions(+), 3 deletions(-) diff --git a/mala/common/parameters.py b/mala/common/parameters.py index eaa30e186..f545afcba 100644 --- a/mala/common/parameters.py +++ b/mala/common/parameters.py @@ -169,7 +169,7 @@ def _json_to_member(json_value): @classmethod def from_json(cls, json_dict): """ - Read this object from a dictionary saved in a JSON file. + Read parameters from a dictionary saved in a JSON file. Parameters ---------- @@ -276,6 +276,10 @@ class ParametersNetwork(ParametersBase): Number of heads to be used in Multi head attention network This should be a divisor of input dimension Default: None + + dropout : float + Dropout rate for positional encoding in transformer. + Default: 0.1 """ def __init__(self): @@ -327,7 +331,51 @@ class ParametersDescriptors(ParametersBase): descriptor vector. If False, no such cutting is peformed. atomic_density_sigma : float - Sigma used for the calculation of the Gaussian descriptors. + Sigma (=width) used for the calculation of the Gaussian descriptors. + Explicitly setting this value is discouraged if the atomic density is + used only during the total energy calculation and, e.g., bispectrum + descriptors are used for models. In this case, the width will + automatically be set correctly during inference based on model + parameters. This parameter mainly exists for debugging purposes. + If the atomic density is instead used for model training itself, this + parameter needs to be set. + + atomic_density_cutoff : float + Cutoff radius used for atomic density calculation. Explicitly setting + this value is discouraged if the atomic density is used only during the + total energy calculation and, e.g., bispectrum descriptors are used + for models. In this case, the cutoff will automatically be set + correctly during inference based on model parameters. This parameter + mainly exists for debugging purposes. If the atomic density is instead + used for model training itself, this parameter needs to be set. + + descriptor_type : str + Type of Descriptors used for model training. Supported are "Bispectrum" + and "AtomicDensity", although only the former is currently used for + published models. + + lammps_compute_file : str + Path to a LAMMPS compute file for the bispectrum descriptor + calculation. MALA has its own collection of compute files which are + used by default. Setting this parameter is thus not necessarys for + model training and inference, and it exists mainly for debugging + purposes. + + minterpy_cutoff_cube_size : float + WILL BE DEPRECATED IN MALA v1.4.0 - size of cube for minterpy + descriptor calculation. + + minterpy_lp_norm : int + WILL BE DEPRECATED IN MALA v1.4.0 - LP norm for minterpy + descriptor calculation. + + minterpy_point_list : list + WILL BE DEPRECATED IN MALA v1.4.0 - list of points for minterpy + descriptor calculation. + + minterpy_polynomial_degree : int + WILL BE DEPRECATED IN MALA v1.4.0 - polynomial degree for minterpy + descriptor calculation. """ def __init__(self): @@ -718,6 +766,14 @@ class ParametersRunning(ParametersBase): List with two entries determining with which batch/iteration number the CUDA profiler will start and stop profiling. 
Please note that this option only holds significance if the nsys profiler is used. + + inference_data_grid : list + Grid dimensions used during inference. Typically, these are automatically + determined by DFT reference data, and this parameter does not need to + be set. Thus, this parameter mainly exists for debugging purposes. + + use_mixed_precision : + If True, mixed precision computation (via AMP) will be used. """ def __init__(self): @@ -726,7 +782,6 @@ def __init__(self): self.learning_rate = 10 ** (-5) self.learning_rate_embedding = 10 ** (-4) self.max_number_epochs = 100 - self.verbosity = True self.mini_batch_size = 10 self.snapshots_per_epoch = -1 @@ -975,6 +1030,15 @@ class ParametersHyperparameterOptimization(ParametersBase): not recommended because it is file based and can lead to errors; With a suitable timeout it can be used somewhat stable though and help in HPC settings. + + acsd_points : int + Parameter of the ACSD HyperparamterOptimization scheme. Controls + the number of point-pairs which are used to compute the ACSD. + An array of acsd_points*acsd_points will be computed, i.e., if + acsd_points=100, 100 points will be drawn at random, and thereafter + each of these 100 points will be compared with a new, random set + of 100 points, leading to 10000 points in total for the calculation + of the ACSD. """ def __init__(self): @@ -1184,6 +1248,9 @@ class Parameters: manual_seed: int If not none, this value is used as manual seed for the neural networks. Can be used to make experiments comparable. Default: None. + + datageneration : ParametersDataGeneration + Parameters used for data generation routines. """ def __init__(self): From 4deab668b219f4dc112e9eb3322239f696bb18f0 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Mon, 25 Nov 2024 21:38:30 +0100 Subject: [PATCH 18/21] Fixed a few docstring problems when building --- mala/common/parameters.py | 17 ----------------- mala/datageneration/trajectory_analyzer.py | 3 --- mala/datahandling/snapshot.py | 4 ---- mala/interfaces/ase_calculator.py | 3 --- mala/network/trainer.py | 1 - mala/targets/density.py | 15 ++++----------- mala/targets/dos.py | 5 ----- mala/targets/ldos.py | 8 +------- mala/targets/target.py | 6 +----- 9 files changed, 6 insertions(+), 56 deletions(-) diff --git a/mala/common/parameters.py b/mala/common/parameters.py index f545afcba..239409122 100644 --- a/mala/common/parameters.py +++ b/mala/common/parameters.py @@ -320,11 +320,6 @@ class ParametersDescriptors(ParametersBase): bispectrum descriptors. Default value for jmax is 5, so default value for twojmax is 10. - lammps_compute_file : string - Bispectrum calculation: LAMMPS input file that is used to calculate the - Bispectrum descriptors. If this string is empty, the standard LAMMPS input - file found in this repository will be used (recommended). - descriptors_contain_xyz : bool Legacy option. If True, it is assumed that the first three entries of the descriptor vector are the xyz coordinates and they are cut from the @@ -349,11 +344,6 @@ class ParametersDescriptors(ParametersBase): mainly exists for debugging purposes. If the atomic density is instead used for model training itself, this parameter needs to be set. - descriptor_type : str - Type of Descriptors used for model training. Supported are "Bispectrum" - and "AtomicDensity", although only the former is currently used for - published models. - lammps_compute_file : str Path to a LAMMPS compute file for the bispectrum descriptor calculation. 
MALA has its own collection of compute files which are @@ -751,13 +741,6 @@ class ParametersRunning(ParametersBase): in a subfolder of logging_dir labelled with the starting date of the logging, to avoid having to change input scripts often. - inference_data_grid : list - List holding the grid to be used for inference in the form of - [x,y,z]. - - use_mixed_precision : bool - If True, mixed precision computation (via AMP) will be used. - training_log_interval : int Determines how often detailed performance info is printed during training (only has an effect if the verbosity is high enough). diff --git a/mala/datageneration/trajectory_analyzer.py b/mala/datageneration/trajectory_analyzer.py index 09da64ebe..fa0493af7 100644 --- a/mala/datageneration/trajectory_analyzer.py +++ b/mala/datageneration/trajectory_analyzer.py @@ -61,9 +61,6 @@ class TrajectoryAnalyzer: First snapshot to be considered during equilibration analysis (i.e., after pruning). - first_snapshot : int - First snapshot that can be considered to be equilibrated. - last_considered_snapshot : int Last snapshot to be considered during equilibration analysis (i.e., after pruning). diff --git a/mala/datahandling/snapshot.py b/mala/datahandling/snapshot.py index 0385da478..1bac8488c 100644 --- a/mala/datahandling/snapshot.py +++ b/mala/datahandling/snapshot.py @@ -45,10 +45,6 @@ class Snapshot(JSONSerializable): Attributes ---------- - calculation_output : string - File with the output of the original snapshot calculation. This is - only needed when testing multiple snapshots. - grid_dimensions : list Grid dimension [x,y,z]. diff --git a/mala/interfaces/ase_calculator.py b/mala/interfaces/ase_calculator.py index 941f36b7f..66e548dfe 100644 --- a/mala/interfaces/ase_calculator.py +++ b/mala/interfaces/ase_calculator.py @@ -46,9 +46,6 @@ class MALA(Calculator): last_energy_contributions : dict Contains all total energy contributions for the last prediction. - - implemented_properties : list - List of which properties can be computed by this calculator. """ implemented_properties = ["energy"] diff --git a/mala/network/trainer.py b/mala/network/trainer.py index 3a12f994a..b5eb0892a 100644 --- a/mala/network/trainer.py +++ b/mala/network/trainer.py @@ -43,7 +43,6 @@ class Trainer(Runner): Attributes ---------- - final_validation_loss : float Validation loss after training diff --git a/mala/targets/density.py b/mala/targets/density.py index f514cf0fa..61623fe24 100644 --- a/mala/targets/density.py +++ b/mala/targets/density.py @@ -36,22 +36,15 @@ class Density(Target): ---------- params : mala.common.parameters.Parameters Parameters used to create this Target object. - - Attributes - ---------- - density : numpy.ndarray - Electronic charge density as a volumetric array. May be 4D or 2D - depending on workflow. - - te_mutex : bool - Total energy module mutual exclusion token used to make sure there - the total energy module is not initialized twice. """ ############################## # Class attributes ############################## - + """ + Total energy module mutual exclusion token used to make sure there + the total energy module is not initialized twice. + """ te_mutex = False ############################## diff --git a/mala/targets/dos.py b/mala/targets/dos.py index 2ce7bcb76..b1f6f103b 100644 --- a/mala/targets/dos.py +++ b/mala/targets/dos.py @@ -28,11 +28,6 @@ class DOS(Target): ---------- params : mala.common.parameters.Parameters Parameters used to create this TargetBase object. 
- - Attributes - ---------- - density_of_states : numpy.ndarray - Electronic density of states. """ ############################## diff --git a/mala/targets/ldos.py b/mala/targets/ldos.py index 363af7f11..c53245003 100644 --- a/mala/targets/ldos.py +++ b/mala/targets/ldos.py @@ -34,13 +34,6 @@ class LDOS(Target): ---------- params : mala.common.parameters.Parameters Parameters used to create this LDOS object. - - Attributes - ---------- - - local_density_of_states : numpy.ndarray - Electronic local density of states as a volumetric array. - May be 4D- or 2D depending on workflow. """ ############################## @@ -248,6 +241,7 @@ def get_target(self): It should work for all implemented targets. Returns + ------- local_density_of_states : numpy.ndarray Electronic local density of states as a volumetric array. May be 4D- or 2D depending on workflow. diff --git a/mala/targets/target.py b/mala/targets/target.py index ebd32f763..10a414c6c 100644 --- a/mala/targets/target.py +++ b/mala/targets/target.py @@ -27,7 +27,7 @@ class Target(PhysicalData): - """ + r""" Base class for all target quantity parser. Target parsers read the target quantity @@ -77,10 +77,6 @@ class Target(PhysicalData): parameters : mala.common.parameters.ParametersTarget MALA target calculation parameters. - qe_input_data : dict - Quantum ESPRESSO data dictionary, read from DFT reference file and - used for the total energy module. - qe_pseudopotentials : list List of Quantum ESPRESSO pseudopotentials, read from DFT reference file and used for the total energy module. From 9aa1c149f40345f3b9bcacff9e8c6946369d5679 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Tue, 26 Nov 2024 11:43:19 +0100 Subject: [PATCH 19/21] Added missing docstring and commented a few redundant ones out --- mala/common/parameters.py | 25 +++++++++++++++++-------- 1 file changed, 17 insertions(+), 8 deletions(-) diff --git a/mala/common/parameters.py b/mala/common/parameters.py index ab19f0654..b929073aa 100644 --- a/mala/common/parameters.py +++ b/mala/common/parameters.py @@ -773,24 +773,33 @@ class ParametersRunning(ParametersBase): determined by DFT reference data, and this parameter does not need to be set. Thus, this parameter mainly exists for debugging purposes. - use_mixed_precision : + use_mixed_precision : bool If True, mixed precision computation (via AMP) will be used. + + l2_regularization : float + Weight decay rate for NN optimizer. + + dropout : float + Dropout rate for positional encoding in transformer net. + + training_log_interval : int + Number of data points after which metrics will be logged. 
""" def __init__(self): super(ParametersRunning, self).__init__() self.optimizer = "Adam" self.learning_rate = 10 ** (-5) - self.learning_rate_embedding = 10 ** (-4) + # self.learning_rate_embedding = 10 ** (-4) self.max_number_epochs = 100 self.mini_batch_size = 10 - self.snapshots_per_epoch = -1 + # self.snapshots_per_epoch = -1 - self.l1_regularization = 0.0 + # self.l1_regularization = 0.0 self.l2_regularization = 0.0 self.dropout = 0.0 - self.batch_norm = False - self.input_noise = 0.0 + # self.batch_norm = False + # self.input_noise = 0.0 self.early_stopping_epochs = 0 self.early_stopping_threshold = 0 @@ -799,11 +808,11 @@ def __init__(self): self.learning_rate_patience = 0 self._during_training_metric = "ldos" self._after_training_metric = "ldos" - self.use_compression = False + # self.use_compression = False self.num_workers = 0 self.use_shuffling_for_samplers = True self.checkpoints_each_epoch = 0 - self.checkpoint_best_so_far = False + # self.checkpoint_best_so_far = False self.checkpoint_name = "checkpoint_mala" self.run_name = "" self.logging_dir = "./mala_logging" From 47ef53cadea39ccd2e85b66223a2ebb7f24f2318 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Tue, 26 Nov 2024 11:45:18 +0100 Subject: [PATCH 20/21] Duplicate docstring --- mala/common/parameters.py | 3 --- 1 file changed, 3 deletions(-) diff --git a/mala/common/parameters.py b/mala/common/parameters.py index b929073aa..5aa41afc5 100644 --- a/mala/common/parameters.py +++ b/mala/common/parameters.py @@ -781,9 +781,6 @@ class ParametersRunning(ParametersBase): dropout : float Dropout rate for positional encoding in transformer net. - - training_log_interval : int - Number of data points after which metrics will be logged. """ def __init__(self): From b9e4ed26e7fea4da03c52c7c47b93c8585a548c9 Mon Sep 17 00:00:00 2001 From: Lenz Fiedler Date: Tue, 26 Nov 2024 14:41:14 +0100 Subject: [PATCH 21/21] Small typo --- mala/datahandling/data_scaler.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mala/datahandling/data_scaler.py b/mala/datahandling/data_scaler.py index 8064b865a..5840e8816 100644 --- a/mala/datahandling/data_scaler.py +++ b/mala/datahandling/data_scaler.py @@ -65,7 +65,7 @@ class DataScaler: mins : torch.Tensor (Managed internally, not set to private due to legacy issues) - scale_normal : bool + scale_minmax : bool (Managed internally, not set to private due to legacy issues) scale_standard : bool