nomad-coe
diff --git a/pyproject.toml b/pyproject.toml
Lines changed: 5 additions & 0 deletions
diff --git a/src/nomad_simulations/schema_packages/atoms_state.py b/src/nomad_simulations/schema_packages/atoms_state.py
Lines changed: 2 additions & 0 deletions
diff --git a/src/nomad_simulations/schema_packages/common.py b/src/nomad_simulations/schema_packages/common.py
Lines changed: 2 additions & 2 deletions
diff --git a/src/nomad_simulations/schema_packages/errors.py b/src/nomad_simulations/schema_packages/errors.py
Lines changed: 164 additions & 0 deletions
diff --git a/src/nomad_simulations/schema_packages/force_field.py b/src/nomad_simulations/schema_packages/force_field.py
Lines changed: 2 additions & 9 deletions
diff --git a/src/nomad_simulations/schema_packages/general.py b/src/nomad_simulations/schema_packages/general.py
Lines changed: 2 additions & 41 deletions
@@ -39,11 +39,16 @@ dependencies = [
 "Documentation" = "https://nomad-coe.github.io/nomad-simulations/"
 
 [project.optional-dependencies]
+md = [
+    'MDAnalysis>=2.4.0',
+    'networkx',
+]
 dev = [
     'mypy>=1.15',
     'pytest>= 5.3.0, <8',
     'pytest-timeout>=1.4.2',
     'pytest-cov>=2.7.1',
+    'pytest-asyncio>=0.21.0',
     'ruff>=0.6',
     'structlog>=1.0',
     'typing-extensions>=4.12',
 
@@ -8,7 +8,9 @@
 from nomad.units import ureg
 
 if TYPE_CHECKING:
+    from nomad.datamodel.context import Context
     from nomad.datamodel.datamodel import EntryArchive
+    from nomad.metainfo import Section
     from structlog.stdlib import BoundLogger
 
 from nomad_simulations.schema_packages.data_types import (
 
@@ -4,15 +4,15 @@
 from nomad.metainfo import Datetime, Quantity
 
 
-class Time(ArchiveSection):
+class SimulationTime(ArchiveSection):
     """
     Contains time-related quantities.
     """
 
     datetime_end = Quantity(
         type=Datetime,
         description="""
-        The date and time when this computation ended.
+        The date and time when the computation ended.
         """,
         a_eln=ELNAnnotation(component='DateTimeEditQuantity'),
     )
 
@@ -0,0 +1,164 @@
+import numpy as np
+from nomad.datamodel.data import ArchiveSection
+from nomad.metainfo import MEnum, Quantity, Section, SubSection
+
+
+# TODO This entire module is a prototype, to be tested and refined
+class ErrorEstimate(ArchiveSection):
+    """
+    A generic container for uncertainty/error information associated with a PhysicalProperty.
+
+    Supports:
+      - Scalar or array errors (aligned to the property's `value` shape).
+      - Confidence/prediction intervals.
+      - Named metrics (std, stderr, RMSE, MAE, ...).
+      - Method/provenance metadata (bootstrap, jackknife, analytical, validation).
+    """
+
+    # What kind of measure is this?
+    metric = Quantity(
+        type=MEnum(
+            'std',
+            'stderr',
+            'variance',
+            'rmse',
+            'mae',
+            'mape',
+            'ci',  # confidence interval
+            'pi',  # prediction interval
+            'iqr',
+            'mad',
+            'systematic_bias',
+            'model_uncertainty',
+            'other',
+        ),
+        description="""
+        The type of error or uncertainty metric being reported.
+
+        Allowed values are:
+
+        | Value             | Description                                                                 |
+        |-------------------|-----------------------------------------------------------------------------|
+        | `"std"`           | Standard deviation of the observable.                                       |
+        | `"stderr"`        | Standard error of the mean (std / √N).                                      |
+        | `"variance"`      | Variance of the observable (σ²).                                            |
+        | `"rmse"`          | Root-mean-square error between predictions and reference values.            |
+        | `"mae"`           | Mean absolute error between predictions and reference values.               |
+        | `"mape"`          | Mean absolute percentage error, expressed relative to reference values.     |
+        | `"ci"`            | Confidence interval for the observable, typically with a specified level.   |
+        | `"pi"`            | Prediction interval for new observations.                                   |
+        | `"iqr"`           | Interquartile range (Q3 – Q1).                                              |
+        | `"mad"`           | Median absolute deviation (robust alternative to standard deviation).       |
+        | `"systematic_bias"` | Estimated systematic offset (bias) between observed and true values.      |
+        | `"model_uncertainty"` | Uncertainty arising from the model itself (e.g., ML predictive spread). |
+        | `"other"`         | A different metric not covered above; further specified in `notes` or `definition_iri`. |
+        """,
+    )
+
+    # Optional URI to a formal definition (VIM/GUM, CODATA, or internal ontology)
+    definition_iri = Quantity(
+        type=str, description='IRI/URL pointing to a formal metric definition.'
+    )
+
+    # Optional name of the procedure used to obtain the estimate (e.g., "bootstrap", "jackknife", "analytical")
+    method = Quantity(
+        type=str,
+        description='Computation method for the estimate (e.g., bootstrap, jackknife, analytical).',
+    )
+
+    n_samples = Quantity(
+        type=np.int32,
+        description='Number of samples used to compute the estimate (if applicable).',
+    )
+
+    # Scope clarifies where this error applies
+    scope = Quantity(
+        type=MEnum('global', 'per_value', 'per_component', 'per_entity'),
+        description="""
+        The application scope of the estimate:
+        - global: single number applies to the whole property;
+        - per_value: array aligned with the property's value array;
+        - per_component: aligned with a named component axis (see `component_axis`);
+        - per_entity: aligned with referenced entities.
+        """,
+    )
+
+    # If scope == per_component, name the axis (e.g., "spin", "kpoint", "band", "species")
+    component_axis = Quantity(
+        type=str,
+        description='Name of the component axis this estimate aligns to (used with scope=per_component).',
+    )
+
+    # Scalar/array error value (std, stderr, rmse, mae, etc.)
+    value = Quantity(
+        type=np.float64,
+        shape=['*'],  # allow scalar (len 1) or arbitrary flatten/broadcast
+        description='Error/uncertainty values for metrics such as std, stderr, rmse, mae, etc.',
+    )
+
+    # Intervals (confidence or prediction)
+    interval_type = Quantity(
+        type=MEnum('confidence', 'prediction'),
+        description='Type of interval if an interval is provided.',
+    )
+
+    level = Quantity(
+        type=np.float64, description='Interval level (e.g., 0.95 for 95% intervals).'
+    )
+
+    lower = Quantity(
+        type=np.float64,
+        shape=['*'],
+        description='Lower bound of the interval (scalar or array aligned to the target).',
+    )
+
+    upper = Quantity(
+        type=np.float64,
+        shape=['*'],
+        description='Upper bound of the interval (scalar or array aligned to the target).',
+    )
+
+    # Optional estimate of known systematic effects (units should match the property)
+    bias = Quantity(
+        type=np.float64,
+        shape=['*'],
+        description='Estimated systematic bias (scalar or array).',
+    )
+
+    # Free-form notes (e.g., cross-validation split, dataset, calibration model, etc.)
+    notes = Quantity(
+        type=str, description='Free-text provenance or remarks about the estimate.'
+    )
+
+    def normalize(self, archive, logger):
+        """
+        Log value-free hints on metric/interval type, level, bounds, and scope.
+        Property-aware shape checks may later be added in PhysicalProperty.normalize.
+        """
+        # Chain up first: NOMAD asks normalize overrides to call the parent implementation.
+        super().normalize(archive, logger)
+
+        if self.metric in ('ci', 'pi') and self.interval_type is None:
+            logger.warning(
+                'Interval-type metric is used without specifying an interval type.'
+            )
+
+        if self.interval_type is not None and self.metric not in ('ci', 'pi', 'other'):
+            logger.warning(
+                'Interval type is set but the metric is not an interval metric.'
+            )
+
+        if self.level is not None and not (0.0 < self.level < 1.0):
+            logger.warning(
+                'Interval level is outside the typical open interval (0, 1).'
+            )
+
+        if (self.lower is None) ^ (self.upper is None):
+            logger.warning(
+                'Only one interval bound is provided; both lower and upper are recommended.'
+            )
+
+        if self.scope is None:
+            logger.info(
+                'No scope specified for the error estimate; default interpretation may apply.'
+            )
@@ -4,17 +4,10 @@
 # from structlog.stdlib import BoundLogger
 import numpy as np
 from ase.dft.kpoints import get_monkhorst_pack_size_and_offset, monkhorst_pack
+from nomad.datamodel.context import Context
 from nomad.datamodel.data import ArchiveSection
 from nomad.datamodel.metainfo.annotations import ELNAnnotation
-from nomad.metainfo import (
-    JSON,
-    URL,
-    Context,
-    MEnum,
-    Quantity,
-    Section,
-    SubSection,
-)
+from nomad.metainfo import JSON, URL, MEnum, Quantity, Section, SubSection
 from nomad.units import ureg
 from scipy.interpolate import UnivariateSpline
 
 
@@ -22,7 +22,7 @@
 from nomad_simulations.schema_packages.outputs import Outputs
 from nomad_simulations.schema_packages.utils import get_composition, log
 
-from .common import Time
+from .common import SimulationTime
 
 configuration = config.get_plugin_entry_point(
     'nomad_simulations.schema_packages:nomad_simulations_plugin'
@@ -115,7 +115,7 @@ class Program(Entity):
     )
 
 
-class BaseSimulation(Activity, Time):
+class BaseSimulation(Activity, SimulationTime):
     """
     A computational simulation that produces output data from a given input model system
     and input methodological parameters.
@@ -129,45 +129,6 @@ class BaseSimulation(Activity, Time):
         links=['https://liusemweb.github.io/mdo/core/1.1/index.html#Calculation']
     )
 
-    datetime_end = Quantity(
-        type=Datetime,
-        description="""
-        The date and time when this computation ended.
-        """,
-    )
-
-    cpu1_start = Quantity(
-        type=np.float64,
-        unit='second',
-        description="""
-        The starting time of the computation on the (first) CPU 1.
-        """,
-    )
-
-    cpu1_end = Quantity(
-        type=np.float64,
-        unit='second',
-        description="""
-        The end time of the computation on the (first) CPU 1.
-        """,
-    )
-
-    wall_start = Quantity(
-        type=np.float64,
-        unit='second',
-        description="""
-        The internal wall-clock time from the starting of the computation.
-        """,
-    )
-
-    wall_end = Quantity(
-        type=np.float64,
-        unit='second',
-        description="""
-        The internal wall-clock time from the end of the computation.
-        """,
-    )
-
     program = SubSection(sub_section=Program.m_def, repeats=False)