Commit 1d0b0d1

jax predict and further preprocessing options

1 parent 611cff0

15 files changed: +429, -24 lines

equitrain/argparser.py

Lines changed: 12 additions & 0 deletions

```diff
@@ -440,6 +440,12 @@ def get_args_parser(script_type: str) -> argparse.ArgumentParser:
         parser.add_argument(
             '--output-dir', help='Output directory', type=str, default=''
         )
+        parser.add_argument(
+            '--niggli-reduce',
+            help='Apply Niggli reduction to periodic cells before writing HDF5 data',
+            action='store_true',
+            default=False,
+        )
 
     elif script_type == 'train':
         add_common_file_args(parser)
@@ -510,6 +516,12 @@ def get_args_parser(script_type: str) -> argparse.ArgumentParser:
         add_common_data_args(parser)
         add_model_args(parser)
         add_loss_weights_args(parser)
+        parser.add_argument(
+            '--niggli-reduce',
+            help='Apply Niggli reduction before graph construction at inference time',
+            action='store_true',
+            default=False,
+        )
         parser.add_argument(
             '--predict-file',
             help='File with data for which predictions should be computed',
```

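The flag is registered the same way in both parsers, so a quick smoke test can confirm the wiring. A minimal sketch, assuming no other argument of the `'predict'` parser is mandatory at parse time:

```python
# Hypothetical smoke test for the new flag; relies only on get_args_parser
# as shown in the diff above.
from equitrain.argparser import get_args_parser

parser = get_args_parser('predict')

# Enabled explicitly on the command line.
assert parser.parse_args(['--niggli-reduce']).niggli_reduce is True

# Defaults to False when omitted, matching default=False above.
assert parser.parse_args([]).niggli_reduce is False
```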
equitrain/backends/jax_backend.py

Lines changed: 10 additions & 3 deletions

```diff
@@ -470,8 +470,13 @@ def train(args):
     if r_max <= 0.0:
         raise RuntimeError('Model configuration must define a positive `r_max`.')
 
-    train_graphs = atoms_to_graphs(args.train_file, r_max, z_table)
-    valid_graphs = atoms_to_graphs(args.valid_file, r_max, z_table)
+    reduce_cells = getattr(args, 'niggli_reduce', False)
+    train_graphs = atoms_to_graphs(
+        args.train_file, r_max, z_table, niggli_reduce=reduce_cells
+    )
+    valid_graphs = atoms_to_graphs(
+        args.valid_file, r_max, z_table, niggli_reduce=reduce_cells
+    )
 
     if not train_graphs:
         raise RuntimeError('Training dataset is empty.')
@@ -755,7 +760,9 @@ def _host(tree):
 
     test_metrics = None
     if getattr(args, 'test_file', None):
-        test_graphs = atoms_to_graphs(args.test_file, r_max, z_table)
+        test_graphs = atoms_to_graphs(
+            args.test_file, r_max, z_table, niggli_reduce=reduce_cells
+        )
         test_loader = build_loader(
             test_graphs,
             batch_size=args.batch_size,
```

equitrain/backends/jax_evaluate.py

Lines changed: 6 additions & 1 deletion

```diff
@@ -44,7 +44,12 @@ def evaluate(args):
     if r_max <= 0.0:
         raise RuntimeError('Model configuration must define a positive `r_max`.')
 
-    test_graphs = atoms_to_graphs(args.test_file, r_max, z_table)
+    test_graphs = atoms_to_graphs(
+        args.test_file,
+        r_max,
+        z_table,
+        niggli_reduce=getattr(args, 'niggli_reduce', False),
+    )
     if not test_graphs:
         raise RuntimeError('Test dataset is empty.')
```

equitrain/backends/jax_predict.py

Lines changed: 130 additions & 0 deletions (new file)

```python
from __future__ import annotations

import jax
import jax.numpy as jnp
import numpy as np
from jax import tree_util as jtu
from mace_jax.data.utils import AtomicNumberTable as JaxAtomicNumberTable

from equitrain.argparser import check_args_complete
from equitrain.data.backend_jax import atoms_to_graphs, build_loader, make_apply_fn


def _is_multi_device() -> bool:
    return jax.local_device_count() > 1


def _prepare_single_batch(graph):
    def _to_device_array(x):
        if x is None:
            return None
        return jnp.asarray(x)

    return jtu.tree_map(_to_device_array, graph, is_leaf=lambda leaf: leaf is None)


def _stack_or_none(chunks):
    if not chunks:
        return None
    return np.concatenate(chunks, axis=0)


def predict(args):
    check_args_complete(args, 'predict')
    backend = getattr(args, 'backend', 'torch') or 'torch'
    if backend != 'jax':
        raise NotImplementedError(
            f'JAX predict backend invoked with unsupported backend="{backend}".'
        )

    if getattr(args, 'predict_file', None) is None:
        raise ValueError('--predict-file is a required argument for JAX prediction.')
    if getattr(args, 'model', None) is None:
        raise ValueError('--model is a required argument for JAX prediction.')

    if _is_multi_device():
        raise NotImplementedError(
            'JAX prediction currently supports single-device runs only. '
            'Set XLA flags to limit execution to one device.'
        )

    bundle = _load_bundle(args.model, dtype=args.dtype)

    atomic_numbers = bundle.config.get('atomic_numbers')
    if not atomic_numbers:
        raise RuntimeError('Model configuration is missing `atomic_numbers`.')
    z_table = JaxAtomicNumberTable(atomic_numbers)

    r_max = (
        float(args.r_max)
        if getattr(args, 'r_max', None)
        else float(bundle.config.get('r_max', 0.0))
    )
    if r_max <= 0.0:
        raise RuntimeError(
            'Model configuration must define a positive `r_max`, or override via --r-max.'
        )

    graphs = atoms_to_graphs(
        args.predict_file,
        r_max,
        z_table,
        niggli_reduce=getattr(args, 'niggli_reduce', False),
    )
    loader = build_loader(
        graphs,
        batch_size=args.batch_size,
        shuffle=False,
        max_nodes=args.batch_max_nodes,
        max_edges=args.batch_max_edges,
        drop=getattr(args, 'batch_drop', False),
    )
    if loader is None:
        raise RuntimeError('Prediction dataset is empty.')

    wrapper = _create_wrapper(
        bundle,
        compute_force=getattr(args, 'forces_weight', 0.0) > 0.0,
        compute_stress=getattr(args, 'stress_weight', 0.0) > 0.0,
    )
    apply_fn = make_apply_fn(wrapper, num_species=len(z_table))
    apply_fn = jax.jit(apply_fn)

    energies: list[np.ndarray] = []
    forces: list[np.ndarray] = []
    stresses: list[np.ndarray] = []

    for batch in loader:
        micro_batches = batch if isinstance(batch, list) else [batch]
        for micro in micro_batches:
            prepared = _prepare_single_batch(micro)
            outputs = jax.device_get(apply_fn(bundle.params, prepared))
            energy_pred = np.asarray(outputs['energy'])
            energies.append(energy_pred.reshape(-1))

            if outputs.get('forces') is not None:
                forces.append(np.asarray(outputs['forces']))
            if outputs.get('stress') is not None:
                stresses.append(np.asarray(outputs['stress']))

    return _stack_or_none(energies), _stack_or_none(forces), _stack_or_none(stresses)


def _load_bundle(model_path: str, dtype: str):
    from equitrain.backends.jax_utils import load_model_bundle as _load_model_bundle

    return _load_model_bundle(model_path, dtype=dtype)


def _create_wrapper(bundle, *, compute_force: bool, compute_stress: bool):
    from equitrain.backends.jax_wrappers import MaceWrapper as JaxMaceWrapper

    return JaxMaceWrapper(
        module=bundle.module,
        config=bundle.config,
        compute_force=compute_force,
        compute_stress=compute_stress,
    )


__all__ = ['predict']
```

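Because `predict` pulls everything from the argument namespace, it can also be driven programmatically. A hedged sketch follows; the file paths are hypothetical, and `check_args_complete` may insist on further fields not listed here:

```python
# Sketch only: field names mirror the attributes predict() reads above.
from types import SimpleNamespace

from equitrain.backends.jax_predict import predict

args = SimpleNamespace(
    backend='jax',
    model='checkpoints/mace.eqx',   # hypothetical model bundle path
    predict_file='predict.h5',      # hypothetical HDF5 input
    dtype='float32',
    r_max=None,                     # fall back to the model config's r_max
    batch_size=16,
    batch_max_nodes=None,
    batch_max_edges=None,
    batch_drop=False,
    forces_weight=1.0,              # > 0.0 switches force outputs on
    stress_weight=0.0,              # 0.0 leaves stresses as None
    niggli_reduce=True,
)

energies, forces, stresses = predict(args)  # stresses is None here
```

Note that force and stress computation is gated on the loss weights rather than on dedicated flags, so callers opt in by setting `forces_weight` or `stress_weight` above zero.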
equitrain/backends/torch_predict.py

Lines changed: 10 additions & 1 deletion

```diff
@@ -11,6 +11,7 @@
 from equitrain.data.atomic import AtomicNumberTable
 from equitrain.data.backend_torch.atoms_to_graphs import AtomsToGraphs
 from equitrain.data.backend_torch.loaders import get_dataloader
+from equitrain.data.configuration import niggli_reduce_inplace
 
 
 def predict_graphs(
@@ -59,6 +60,7 @@ def predict_atoms(
     pin_memory=False,
     batch_size=12,
     device=None,
+    niggli_reduce: bool = False,
 ) -> list[torch.Tensor]:
     atoms_to_graphs = AtomsToGraphs(
         z_table,
@@ -72,7 +74,12 @@ def predict_atoms(
         r_pbc=True,
     )
 
-    graph_list = [atoms_to_graphs.convert(atom) for atom in atoms_list]
+    graph_list = []
+    for atom in atoms_list:
+        atoms_copy = atom.copy()
+        if niggli_reduce:
+            niggli_reduce_inplace(atoms_copy)
+        graph_list.append(atoms_to_graphs.convert(atoms_copy))
 
     return predict_graphs(
         model,
@@ -93,6 +100,7 @@ def predict_structures(
     pin_memory=False,
     batch_size=12,
     device=None,
+    niggli_reduce: bool = False,
 ) -> list[torch.Tensor]:
     atoms_list = [AseAtomsAdaptor.get_atoms(structure) for structure in structure_list]
     return predict_atoms(
@@ -104,6 +112,7 @@ def predict_structures(
         pin_memory=pin_memory,
         batch_size=batch_size,
         device=device,
+        niggli_reduce=niggli_reduce,
     )
```

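The rewritten loop copies each `Atoms` object before (optionally) reducing it, so the caller's `atoms_list` is never mutated, with or without the flag. The same pattern can be illustrated with plain ASE, independent of equitrain:

```python
# Pure-ASE illustration of the copy-then-reduce pattern used above.
from ase import Atoms
from ase.build.tools import niggli_reduce

# A deliberately skewed periodic cell that Niggli reduction will tidy up.
original = Atoms('Cu', positions=[[0.0, 0.0, 0.0]], pbc=True,
                 cell=[[3.6, 0.0, 0.0], [3.4, 3.6, 0.0], [0.0, 0.0, 3.6]])

reduced = original.copy()
niggli_reduce(reduced)  # mutates only the copy

assert len(reduced) == len(original)                              # same atoms
assert abs(reduced.get_volume() - original.get_volume()) < 1e-10  # same volume
```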
equitrain/data/backend_jax/atoms_to_graphs.py

Lines changed: 9 additions & 1 deletion

```diff
@@ -10,14 +10,19 @@
 from mace_jax.data.utils import Configuration as JaxConfiguration
 from mace_jax.data.utils import graph_from_configuration
 
-from equitrain.data.configuration import Configuration as EqConfiguration
+from equitrain.data.configuration import (
+    Configuration as EqConfiguration,
+    niggli_reduce_inplace,
+)
 from equitrain.data.format_hdf5.dataset import HDF5Dataset
 
 
 def atoms_to_graphs(
     data_path: Path | str,
     r_max: float,
     z_table: JaxAtomicNumberTable,
+    *,
+    niggli_reduce: bool = False,
 ) -> list[jraph.GraphsTuple]:
     if data_path is None:
         return []
@@ -27,6 +32,9 @@ def atoms_to_graphs(
     try:
         for idx in range(len(dataset)):
             atoms = dataset[idx]
+            if niggli_reduce:
+                atoms = atoms.copy()
+                niggli_reduce_inplace(atoms)
             eq_conf = EqConfiguration.from_atoms(atoms)
             jax_conf = JaxConfiguration(
                 atomic_numbers=eq_conf.atomic_numbers,
```

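The new argument is keyword-only, so existing positional call sites keep working unchanged. A hedged usage sketch (file name and species list hypothetical):

```python
from mace_jax.data.utils import AtomicNumberTable as JaxAtomicNumberTable

from equitrain.data.backend_jax import atoms_to_graphs

z_table = JaxAtomicNumberTable([1, 8])  # e.g. an O/H-only dataset
graphs = atoms_to_graphs(
    'valid.h5',          # hypothetical HDF5 file
    4.5,                 # r_max, in the dataset's length units
    z_table,
    niggli_reduce=True,  # keyword-only; omitting it preserves old behaviour
)
```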
equitrain/data/backend_torch/loaders.py

Lines changed: 7 additions & 1 deletion

```diff
@@ -80,7 +80,13 @@ def get_dataloader(
     if data_file is None:
         return None
 
-    data_set = HDF5GraphDataset(data_file, r_max=r_max, atomic_numbers=atomic_numbers)
+    niggli_reduce = getattr(args, 'niggli_reduce', False)
+    data_set = HDF5GraphDataset(
+        data_file,
+        r_max=r_max,
+        atomic_numbers=atomic_numbers,
+        niggli_reduce=niggli_reduce,
+    )
 
     pin_memory = _should_pin_memory(args.pin_memory, accelerator)
     num_workers = _resolve_num_workers(args.workers, accelerator)
```

equitrain/data/configuration.py

Lines changed: 14 additions & 0 deletions

```diff
@@ -156,3 +156,17 @@ def get_forces(self, apply_constraint=False):
 
     def get_stress(self, apply_constraint=False):
         return self.stress
+
+
+def niggli_reduce_inplace(atoms):
+    """Apply an in-place Niggli reduction when periodic directions exist."""
+    from ase.build.tools import niggli_reduce as _niggli_reduce
+
+    pbc = getattr(atoms, 'pbc', None)
+    if pbc is None:
+        return atoms
+    if not np.any(pbc):
+        return atoms
+
+    _niggli_reduce(atoms)
+    return atoms
```

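Because of the `pbc` guard, isolated molecules pass through untouched, so callers may apply the helper unconditionally. A small sketch of the no-op path, using only the import location shown above:

```python
from ase import Atoms

from equitrain.data.configuration import niggli_reduce_inplace

# pbc defaults to all-False for a bare molecule, so the helper returns
# the same object without attempting a reduction.
water = Atoms('OH2', positions=[[0.0, 0.0, 0.0],
                                [0.96, 0.0, 0.0],
                                [-0.24, 0.93, 0.0]])
assert niggli_reduce_inplace(water) is water
```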
equitrain/data/format_hdf5/dataset.py

Lines changed: 5 additions & 1 deletion

```diff
@@ -5,7 +5,7 @@
 from ase import Atoms
 
 from equitrain.data.atomic import AtomicNumberTable
-from equitrain.data.configuration import CachedCalc
+from equitrain.data.configuration import CachedCalc, niggli_reduce_inplace
 
 
 class HDF5Dataset:
@@ -295,11 +295,13 @@ def __init__(
         r_max: float,
         atomic_numbers: AtomicNumberTable,
         *,
+        niggli_reduce: bool = False,
         atoms_to_graphs_cls=None,
         **kwargs,
     ):
         super().__init__(filename, mode='r', **kwargs)
 
+        self._niggli_reduce = niggli_reduce
         if atoms_to_graphs_cls is None:
             from equitrain.data.backend_torch import (
                 AtomsToGraphs as atoms_to_graphs_cls,
@@ -317,6 +319,8 @@ def __init__(
 
     def __getitem__(self, index):
         atoms = super().__getitem__(index)
+        if self._niggli_reduce:
+            niggli_reduce_inplace(atoms)
         graph = self.converter.convert(atoms)
         graph.idx = index
```

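Downstream, the option reaches the torch path through the constructor shown above. A hedged construction sketch; the import location and the `AtomicNumberTable` constructor are assumptions based on how both are used elsewhere in this commit:

```python
from equitrain.data.atomic import AtomicNumberTable
from equitrain.data.format_hdf5.dataset import HDF5GraphDataset

z_table = AtomicNumberTable([1, 6, 8])  # hypothetical species set
dataset = HDF5GraphDataset(
    'train.h5',             # hypothetical file written by the preprocessor
    r_max=5.0,
    atomic_numbers=z_table,
    niggli_reduce=True,     # each Atoms object is reduced before conversion
)
graph = dataset[0]
```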
equitrain/data/format_lmdb/lmdb.py

Lines changed: 6 additions & 0 deletions

```diff
@@ -130,6 +130,7 @@ def convert_lmdb_to_hdf5(
     dst: Path | str,
     *,
     config: Mapping | None = None,
+    atoms_transform=None,
     overwrite: bool = False,
     show_progress: bool = False,
 ) -> Path:
@@ -145,6 +146,9 @@ def convert_lmdb_to_hdf5(
         ``overwrite`` is ``True``.
     config:
         Optional dictionary passed to ``AseDBDataset`` (e.g. metadata entries).
+    atoms_transform:
+        Optional callable applied to each ``Atoms`` object prior to storage
+        (e.g. lattice reductions).
     overwrite:
         When ``False`` (default) an existing destination file raises ``FileExistsError``.
     show_progress:
@@ -174,6 +178,8 @@ def convert_lmdb_to_hdf5(
     with HDF5Dataset(dst, mode='w') as storage:
         for index, record in enumerate(iterator):
             atoms = lmdb_entry_to_atoms(record)
+            if atoms_transform is not None:
+                atoms = atoms_transform(atoms)
             storage[index] = atoms
 
     return dst
```

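The new hook composes directly with the helper from `equitrain/data/configuration.py`, since `niggli_reduce_inplace` returns the (possibly reduced) `Atoms` object. A hedged sketch with hypothetical paths; the source path is passed positionally because its parameter name is not shown in this diff:

```python
from equitrain.data.configuration import niggli_reduce_inplace
from equitrain.data.format_lmdb.lmdb import convert_lmdb_to_hdf5

convert_lmdb_to_hdf5(
    'dataset.lmdb',                         # hypothetical LMDB source
    'dataset.h5',                           # hypothetical HDF5 destination
    atoms_transform=niggli_reduce_inplace,  # applied before each write
    overwrite=True,
)
```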