nomad-coe
diff --git a/pyproject.toml b/pyproject.toml
Lines changed: 5 additions & 0 deletions
diff --git a/src/nomad_simulations/schema_packages/common.py b/src/nomad_simulations/schema_packages/common.py
Lines changed: 2 additions & 2 deletions
diff --git a/src/nomad_simulations/schema_packages/errors.py b/src/nomad_simulations/schema_packages/errors.py
Lines changed: 164 additions & 0 deletions
diff --git a/src/nomad_simulations/schema_packages/general.py b/src/nomad_simulations/schema_packages/general.py
Lines changed: 2 additions & 41 deletions
diff --git a/src/nomad_simulations/schema_packages/model_system.py b/src/nomad_simulations/schema_packages/model_system.py
Lines changed: 1 addition & 1 deletion
diff --git a/src/nomad_simulations/schema_packages/numerical_settings.py b/src/nomad_simulations/schema_packages/numerical_settings.py
Lines changed: 3 additions & 2 deletions
diff --git a/src/nomad_simulations/schema_packages/outputs.py b/src/nomad_simulations/schema_packages/outputs.py
Lines changed: 25 additions & 22 deletions
@@ -39,11 +39,16 @@ dependencies = [
 "Documentation" = "https://nomad-coe.github.io/nomad-simulations/"
 
 [project.optional-dependencies]
+md = [
+    "MDAnalysis>=2.4.0",
+    "networkx"
+]
 dev = [
     'mypy>=1.15',
     'pytest>= 5.3.0, <8',
     'pytest-timeout>=1.4.2',
     'pytest-cov>=2.7.1',
+    'pytest-asyncio>=0.21.0',
     'ruff>=0.6',
     'structlog>=1.0',
     'typing-extensions>=4.12',
 
@@ -4,15 +4,15 @@
 from nomad.metainfo import Datetime, Quantity
 
 
-class Time(ArchiveSection):
+class SimulationTime(ArchiveSection):
     """
     Contains time-related quantities.
     """
 
     datetime_end = Quantity(
         type=Datetime,
         description="""
-        The date and time when this computation ended.
+        The date and time when the computation ended.
         """,
         a_eln=ELNAnnotation(component='DateTimeEditQuantity'),
     )
 
@@ -0,0 +1,192 @@
+import numpy as np
+from nomad.datamodel.data import ArchiveSection
+from nomad.metainfo import MEnum, Quantity, Section, SubSection
+
+
+# TODO This entire module is a prototype, to be tested and refined
+class ErrorEstimate(ArchiveSection):
+    """
+    A generic container for uncertainty/error information associated with a PhysicalProperty.
+
+    Supports:
+      - Scalar or array errors (aligned to the property's `value` shape).
+      - Confidence/prediction intervals.
+      - Named metrics (std, stderr, RMSE, MAE, ...).
+      - Method/provenance metadata (bootstrap, jackknife, analytical, validation).
+    """
+
+    # What kind of measure is this?
+    metric = Quantity(
+        type=MEnum(
+            'std',
+            'stderr',
+            'variance',
+            'rmse',
+            'mae',
+            'mape',
+            'ci',  # confidence interval
+            'pi',  # prediction interval
+            'iqr',
+            'mad',
+            'systematic_bias',
+            'model_uncertainty',
+            'other',
+        ),
+        description="""
+        The type of error or uncertainty metric being reported.
+
+        Allowed values are:
+
+        | Value             | Description                                                                 |
+        |-------------------|-----------------------------------------------------------------------------|
+        | `"std"`           | Standard deviation of the observable.                                       |
+        | `"stderr"`        | Standard error of the mean (std / √N).                                      |
+        | `"variance"`      | Variance of the observable (σ²).                                            |
+        | `"rmse"`          | Root-mean-square error between predictions and reference values.            |
+        | `"mae"`           | Mean absolute error between predictions and reference values.               |
+        | `"mape"`          | Mean absolute percentage error, expressed relative to reference values.     |
+        | `"ci"`            | Confidence interval for the observable, typically with a specified level.   |
+        | `"pi"`            | Prediction interval for new observations.                                   |
+        | `"iqr"`           | Interquartile range (Q3 – Q1).                                              |
+        | `"mad"`           | Median absolute deviation (robust alternative to standard deviation).       |
+        | `"systematic_bias"` | Estimated systematic offset (bias) between observed and true values.      |
+        | `"model_uncertainty"` | Uncertainty arising from the model itself (e.g., ML predictive spread). |
+        | `"other"`         | A different metric not covered above; further specified in `notes` or `definition_iri`. |
+        """,
+    )
+
+    # Optional URI to a formal definition (VIM/GUM, CODATA, or internal ontology)
+    definition_iri = Quantity(
+        type=str, description='IRI/URL pointing to a formal metric definition.'
+    )
+
+    # Optional free-text label for how the estimate was computed (e.g., "bootstrap", "jackknife", "analytical")
+    method = Quantity(
+        type=str,
+        description='Computation method for the estimate (e.g., bootstrap, jackknife, analytical).',
+    )
+
+    n_samples = Quantity(
+        type=np.int32,
+        description='Number of samples used to compute the estimate (if applicable).',
+    )
+
+    # Scope clarifies where this error applies
+    scope = Quantity(
+        type=MEnum('global', 'per_value', 'per_component', 'per_entity'),
+        description="""
+        The application scope of the estimate:
+        - global: single number applies to the whole property;
+        - per_value: array aligned with the property's value array;
+        - per_component: aligned with a named component axis (see `component_axis`);
+        - per_entity: aligned with referenced entities.
+        """,
+    )
+
+    # If scope == per_component, name the axis (e.g., "spin", "kpoint", "band", "species")
+    component_axis = Quantity(
+        type=str,
+        description='Name of the component axis this estimate aligns to (used with scope=per_component).',
+    )
+
+    # Scalar/array error value (std, stderr, rmse, mae, etc.)
+    value = Quantity(
+        type=np.float64,
+        shape=['*'],  # 1D, variable length; a scalar is stored as a length-1 array
+        description='Error/uncertainty values for metrics such as std, stderr, rmse, mae, etc.',
+    )
+
+    # Intervals (confidence or prediction)
+    interval_type = Quantity(
+        type=MEnum('confidence', 'prediction'),
+        description='Type of interval if an interval is provided.',
+    )
+
+    level = Quantity(
+        type=np.float64, description='Interval level (e.g., 0.95 for 95% intervals).'
+    )
+
+    lower = Quantity(
+        type=np.float64,
+        shape=['*'],
+        description='Lower bound of the interval (scalar or array aligned to the target).',
+    )
+
+    upper = Quantity(
+        type=np.float64,
+        shape=['*'],
+        description='Upper bound of the interval (scalar or array aligned to the target).',
+    )
+
+    # Optional numeric estimate of known systematic effects (units should match the property)
+    bias = Quantity(
+        type=np.float64,
+        shape=['*'],
+        description='Estimated systematic bias (scalar or array).',
+    )
+
+    # Free-form notes (e.g., cross-validation split, dataset, calibration model, etc.)
+    notes = Quantity(
+        type=str, description='Free-text provenance or remarks about the estimate.'
+    )
+
+    def normalize(self, archive, logger):
+        """
+        Run the base-section normalization, then log generic consistency hints.
+
+        Every check only emits a log message; no quantity is modified. Messages are
+        kept generic on purpose and never contain stored values.
+
+        Args:
+            archive: The archive being normalized; passed on to the base class.
+            logger: Logger that receives the warnings and hints.
+        """
+        # Keep the base-class normalization that the override would otherwise skip
+        super().normalize(archive, logger)
+
+        # Basic metric/interval consistency checks (generic, variable-free messages)
+        if self.metric in ('ci', 'pi') and self.interval_type is None:
+            logger.warning(
+                'Interval-type metric is used without specifying an interval type.'
+            )
+
+        if self.interval_type is not None and self.metric not in ('ci', 'pi', 'other'):
+            logger.warning(
+                'Interval type is set but the metric is not an interval metric.'
+            )
+
+        # 'ci' pairs with 'confidence' and 'pi' with 'prediction'; flag crossed pairs
+        expected_type = {'ci': 'confidence', 'pi': 'prediction'}.get(self.metric)
+        if (
+            expected_type is not None
+            and self.interval_type is not None
+            and self.interval_type != expected_type
+        ):
+            logger.warning('Interval type does not match the interval metric.')
+
+        # Level sanity (if provided)
+        if self.level is not None and not (0.0 < self.level < 1.0):
+            logger.warning(
+                'Interval level is outside the typical open interval (0, 1).'
+            )
+
+        # Interval completeness, and shape/order consistency when both bounds exist
+        if (self.lower is None) ^ (self.upper is None):
+            logger.warning(
+                'Only one interval bound is provided; both lower and upper are recommended.'
+            )
+        elif self.lower is not None:
+            lower, upper = np.asarray(self.lower), np.asarray(self.upper)
+            if lower.shape != upper.shape:
+                logger.warning('Interval bounds have different shapes.')
+            elif np.any(lower > upper):
+                logger.warning('Lower interval bound exceeds the upper bound.')
+
+        # Scope hints
+        if self.scope is None:
+            logger.info(
+                'No scope specified for the error estimate; default interpretation may apply.'
+            )
+
+        # Alignment with the owning property's `value` shape is not checked here;
+        # property-aware checks could be added in PhysicalProperty.normalize if needed.
@@ -22,7 +22,7 @@
 from nomad_simulations.schema_packages.outputs import Outputs
 from nomad_simulations.schema_packages.utils import get_composition, log
 
-from .common import Time
+from .common import SimulationTime
 
 configuration = config.get_plugin_entry_point(
     'nomad_simulations.schema_packages:nomad_simulations_plugin'
@@ -115,7 +115,7 @@ class Program(Entity):
     )
 
 
-class BaseSimulation(Activity, Time):
+class BaseSimulation(Activity, SimulationTime):
     """
     A computational simulation that produces output data from a given input model system
     and input methodological parameters.
@@ -129,45 +129,6 @@ class BaseSimulation(Activity, Time):
         links=['https://liusemweb.github.io/mdo/core/1.1/index.html#Calculation']
     )
 
-    datetime_end = Quantity(
-        type=Datetime,
-        description="""
-        The date and time when this computation ended.
-        """,
-    )
-
-    cpu1_start = Quantity(
-        type=np.float64,
-        unit='second',
-        description="""
-        The starting time of the computation on the (first) CPU 1.
-        """,
-    )
-
-    cpu1_end = Quantity(
-        type=np.float64,
-        unit='second',
-        description="""
-        The end time of the computation on the (first) CPU 1.
-        """,
-    )
-
-    wall_start = Quantity(
-        type=np.float64,
-        unit='second',
-        description="""
-        The internal wall-clock time from the starting of the computation.
-        """,
-    )
-
-    wall_end = Quantity(
-        type=np.float64,
-        unit='second',
-        description="""
-        The internal wall-clock time from the end of the computation.
-        """,
-    )
-
     program = SubSection(sub_section=Program.m_def, repeats=False)
 
 
 
@@ -1500,7 +1500,7 @@ def get_bond_list(self) -> np.ndarray:
         if self._cache.get('bond_list') is not None:
             return self._cache['bond_list']
 
-        bond_list = np.empty((0, 2), dtype=np.int32)
+        bond_list: np.ndarray = np.empty((0, 2), dtype=np.int32)
         # root
         if self.is_root_system():
             bond_list = self.bond_list if self.bond_list is not None else bond_list
 
@@ -381,8 +381,9 @@ def resolve_points_and_offset(
             offset = np.array([0, 0, 0])
         elif self.center == 'Monkhorst-Pack':
             try:
-                points = monkhorst_pack(size=self.grid)
-                offset = get_monkhorst_pack_size_and_offset(kpts=points)[-1]
+                points_array = monkhorst_pack(size=self.grid)
+                points = points_array
+                offset = get_monkhorst_pack_size_and_offset(kpts=points_array)[-1]
             except ValueError:
                 logger.warning(
                     'Could not resolve `KMesh.points` and `KMesh.offset` from `KMesh.grid`. ASE `monkhorst_pack` failed.'
 
@@ -29,16 +29,17 @@
     Permittivity,
     PotentialEnergy,
     QuasiparticleWeight,
+    RadiusOfGyration,
     Temperature,
     TotalEnergy,
     TotalForce,
     XASSpectrum,
 )
 
-from .common import Time
+from .common import SimulationTime
 
 
-class Outputs(Time):
+class Outputs(SimulationTime):
     """
     Output properties of a simulation. This base class can be used for inheritance in any of the output properties
     defined in this schema.
@@ -64,32 +65,28 @@ class Outputs(Time):
         """,
     )
 
+    absorption_spectra = SubSection(sub_section=AbsorptionSpectrum.m_def, repeats=True)
+
     chemical_potentials = SubSection(sub_section=ChemicalPotential.m_def, repeats=True)
 
     crystal_field_splittings = SubSection(
         sub_section=CrystalFieldSplitting.m_def, repeats=True
     )
 
-    hopping_matrices = SubSection(sub_section=HoppingMatrix.m_def, repeats=True)
+    electronic_band_gaps = SubSection(sub_section=ElectronicBandGap.m_def, repeats=True)
 
-    electronic_eigenvalues = SubSection(
-        sub_section=ElectronicEigenvalues.m_def, repeats=True
+    electronic_band_structures = SubSection(
+        sub_section=ElectronicBandStructure.m_def, repeats=True
     )
 
-    electronic_band_gaps = SubSection(sub_section=ElectronicBandGap.m_def, repeats=True)
-
     electronic_dos = SubSection(
         sub_section=ElectronicDensityOfStates.m_def, repeats=True
     )
 
-    fermi_surfaces = SubSection(sub_section=FermiSurface.m_def, repeats=True)
-
-    electronic_band_structures = SubSection(
-        sub_section=ElectronicBandStructure.m_def, repeats=True
+    electronic_eigenvalues = SubSection(
+        sub_section=ElectronicEigenvalues.m_def, repeats=True
     )
 
-    occupancies = SubSection(sub_section=Occupancy.m_def, repeats=True)
-
     electronic_greens_functions = SubSection(
         sub_section=ElectronicGreensFunction.m_def, repeats=True
     )
@@ -98,29 +95,35 @@ class Outputs(Time):
         sub_section=ElectronicSelfEnergy.m_def, repeats=True
     )
 
+    fermi_surfaces = SubSection(sub_section=FermiSurface.m_def, repeats=True)
+
+    hopping_matrices = SubSection(sub_section=HoppingMatrix.m_def, repeats=True)
+
     hybridization_functions = SubSection(
         sub_section=HybridizationFunction.m_def, repeats=True
     )
 
-    quasiparticle_weights = SubSection(
-        sub_section=QuasiparticleWeight.m_def, repeats=True
-    )
+    kinetic_energies = SubSection(sub_section=KineticEnergy.m_def, repeats=True)
+
+    occupancies = SubSection(sub_section=Occupancy.m_def, repeats=True)
 
     permittivities = SubSection(sub_section=Permittivity.m_def, repeats=True)
 
-    absorption_spectra = SubSection(sub_section=AbsorptionSpectrum.m_def, repeats=True)
+    potential_energies = SubSection(sub_section=PotentialEnergy.m_def, repeats=True)
 
-    xas_spectra = SubSection(sub_section=XASSpectrum.m_def, repeats=True)
+    quasiparticle_weights = SubSection(
+        sub_section=QuasiparticleWeight.m_def, repeats=True
+    )
 
-    total_energies = SubSection(sub_section=TotalEnergy.m_def, repeats=True)
+    radii_of_gyration = SubSection(sub_section=RadiusOfGyration.m_def, repeats=True)
 
-    kinetic_energies = SubSection(sub_section=KineticEnergy.m_def, repeats=True)
+    temperatures = SubSection(sub_section=Temperature.m_def, repeats=True)
 
-    potential_energies = SubSection(sub_section=PotentialEnergy.m_def, repeats=True)
+    total_energies = SubSection(sub_section=TotalEnergy.m_def, repeats=True)
 
     total_forces = SubSection(sub_section=TotalForce.m_def, repeats=True)
 
-    temperatures = SubSection(sub_section=Temperature.m_def, repeats=True)
+    xas_spectra = SubSection(sub_section=XASSpectrum.m_def, repeats=True)
 
     # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # #
     # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # #