learningmatter-mit
diff --git a/‎.github/workflows/python-app.yml‎
Lines changed: 47 additions & 0 deletions b/‎.github/workflows/python-app.yml‎
Lines changed: 47 additions & 0 deletions
diff --git a/‎.gitignore‎
Lines changed: 12 additions & 0 deletions b/‎.gitignore‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎nff/analysis/attribution.py‎
Lines changed: 37 additions & 40 deletions b/‎nff/analysis/attribution.py‎
Lines changed: 37 additions & 40 deletions
@@ -0,0 +1,47 @@
+name: Test NeuralForceField package
+
+on: [push]
+
+jobs:
+  build:
+
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        # python-version: ["pypy3.10", "3.8", "3.9", "3.10", "3.11", "3.12", "3.13"]
+        python-version: ["3.10"]
+
+    steps:
+      - uses: actions/checkout@v4
+      - name: Set up Python ${{ matrix.python-version }}
+        uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python-version }}
+      - name: Display Python version
+        run: python -c "import sys; print(sys.version)"
+      - name: Install basics
+        run: python -m pip install --upgrade pip setuptools wheel
+      - name: Install package
+        run: python -m pip install .
+      # - name: Install linters
+      #   run: python -m pip install flake8 mypy pylint
+      # - name: Install documentation requirements
+      #   run: python -m pip install -r docs/requirements.txt
+      # - name: Test with flake8
+      #   run: flake8 nff
+      # - name: Test with mypy
+      #   run: mypy nff
+      # - name: Test with pylint
+      #   run: pylint nff
+      - name: Test with pytest
+        run: |
+         pip install pytest pytest-cov
+         pytest nff/tests --doctest-modules --junitxml=junit/test-results-${{ matrix.python-version }}.xml --cov=nff --cov-report=xml --cov-report=html
+      - name: Upload pytest test results
+        uses: actions/upload-artifact@v4
+        with:
+          name: pytest-results-${{ matrix.python-version }}
+          path: junit/test-results-${{ matrix.python-version }}.xml
+        if: ${{ always() }}
+      # - name: Test documentation
+      #   run: sphinx-build docs/source docs/build
@@ -66,5 +66,17 @@ dist/
 sandbox_excited/
 build/
 
+# Editor files
+# vim
+*.swp
+*.swo
+
+# pycharm
+.idea/
+
+# coverage and tests
+junit
+.coverage
+
 # required exceptions
 !tutorials/models/ammonia/Ammonia.xyz
@@ -1,18 +1,20 @@
+from typing import Dict, List, Optional, Union
+
+import numpy as np
 import torch
-from ase.io import Trajectory, write
 from ase import Atoms
-import numpy as np
+from ase.io import Trajectory, write
+from tqdm import tqdm
 
-from nff.io.ase_calcs import EnsembleNFF
 from nff.io.ase import AtomsBatch
-from nff.utils.scatter import compute_grad
+from nff.io.ase_calcs import EnsembleNFF
 from nff.utils.cuda import batch_to
-from typing import Union
-
-from tqdm import tqdm
+from nff.utils.scatter import compute_grad
 
 
-def get_molecules(atom: AtomsBatch, bond_length: dict = None, mode: str = "bond", **kwargs) -> list[np.array]:
+def get_molecules(
+    atom: AtomsBatch, bond_length: Optional[Dict[str, float]] = None, mode: str = "bond", **kwargs
+) -> List[np.array]:
     """
     Find molecules in a periodic or non-periodic system. Bond mode finds molecules within the bond length.
     A bond_length dict must be passed, e.g. bond_length=dict()
@@ -29,7 +31,8 @@ def get_molecules(atom: AtomsBatch, bond_length: dict = None, mode: str = "bond"
     give an extra cutoff input, e.g. cutoff=6
 
     output:
-    list of array of atom indices in molecules. e.g: if there is a H2O molecule, you will get a list with the atom indices
+    list of arrays of atom indices in molecules, e.g. if there is an H2O molecule,
+    you will get a list with the atom indices
 
     """
     types = list(set(atom.numbers))
@@ -50,15 +53,18 @@ def get_molecules(atom: AtomsBatch, bond_length: dict = None, mode: str = "bond"
         oxy_neighbors = []
         if mode == "bond":
             for t in types:
-                if bond_length.get("%s-%s" % (ty, t)) != None:
+                if bond_length.get(f"{ty}-{t}") is not None:
                     oxy_neighbors.extend(
                         list(
                             np.where(atom.numbers == t)[0][
-                                np.where(dis_sq[i, np.where(atom.numbers == t)[0]] <= bond_length["%s-%s" % (ty, t)])[0]
+                                np.where(dis_sq[i, np.where(atom.numbers == t)[0]] <= bond_length[f"{ty}-{t}"])[0]
                             ]
                         )
                     )
         elif mode == "cutoff":
+            if "cutoff" not in kwargs:
+                raise ValueError("Specifying mode 'cutoff' requires passing a cutoff value as a keyword argument")
+            cutoff = kwargs["cutoff"]
             oxy_neighbors.extend(list(np.where(dis_sq[i] <= cutoff)[0]))  # cutoff input extra argument
         oxy_neighbors = np.array(oxy_neighbors)
         if len(oxy_neighbors) == 0:
@@ -69,10 +75,10 @@ def get_molecules(atom: AtomsBatch, bond_length: dict = None, mode: str = "bond"
         elif (clusters[oxy_neighbors] == 0).all() and clusters[i] == 0:
             clusters[oxy_neighbors] = mm + 1
             clusters[i] = mm + 1
-        elif (clusters[oxy_neighbors] == 0).all() == False and clusters[i] == 0:
+        elif not (clusters[oxy_neighbors] == 0).all() and clusters[i] == 0:
             clusters[i] = min(clusters[oxy_neighbors][clusters[oxy_neighbors] != 0])
             clusters[oxy_neighbors] = min(clusters[oxy_neighbors][clusters[oxy_neighbors] != 0])
-        elif (clusters[oxy_neighbors] == 0).all() == False and clusters[i] != 0:
+        elif not (clusters[oxy_neighbors] == 0).all() and clusters[i] != 0:
             tmp = clusters[oxy_neighbors][clusters[oxy_neighbors] != 0][
                 clusters[oxy_neighbors][clusters[oxy_neighbors] != 0]
                 != min(clusters[oxy_neighbors][clusters[oxy_neighbors] != 0])
@@ -91,17 +97,17 @@ def get_molecules(atom: AtomsBatch, bond_length: dict = None, mode: str = "bond"
     return molecules
 
 
-def reconstruct_atoms(atomsobject: AtomsBatch, mol_idx: list[np.array], centre: int = None):
+def reconstruct_atoms(atomsobject: AtomsBatch, mol_idx: List[np.array], centre: Optional[int] = None):
     """
     Function to shift atoms when we create a non-periodic system from a periodic one.
     inputs:
     atomsobject: AtomsBatch object from NFF
     mol_idx: list of arrays of atom indices in molecules or atoms you want to keep together when changing to a
     non-periodic system
-    centre: by default the atoms in a molecule or set of close atoms are shifted so as to get them close to the centre which
-    is by default the first atom index in the array. For reconstructing molecules this is fine. However, for attribution,
-    we may have to shift a whole molecule to come closer to the atoms with high attribution. In that case, we manually assign
-    the atom index.
+    centre: by default the atoms in a molecule or set of close atoms are shifted so as to get them close
+    to the centre, which is by default the atom at the middle index of the array (len // 2). For reconstructing
+    molecules this is fine. However, for attribution, we may have to shift a whole molecule to come closer to the
+    atoms with high attribution. In that case, we manually assign the atom index.
     """
 
     sys_xyz = torch.Tensor(atomsobject.get_positions(wrap=True))
@@ -111,38 +117,34 @@ def reconstruct_atoms(atomsobject: AtomsBatch, mol_idx: list[np.array], centre:
         mol_xyz = sys_xyz[idx]
         if any(atomsobject.pbc):
             center = mol_xyz.shape[0] // 2
-            if centre != None:
+            if centre is not None:
                 center = centre  # changes the central atom to atom in focus
             intra_dmat = (mol_xyz[None, :, ...] - mol_xyz[:, None, ...])[center]
             if np.count_nonzero(atomsobject.cell.T - np.diag(np.diagonal(atomsobject.cell.T))) != 0:
-                M, N = intra_dmat.shape[0], intra_dmat.shape[1]
+                M, _ = intra_dmat.shape[0], intra_dmat.shape[1]
                 f = torch.linalg.solve(torch.Tensor(atomsobject.cell.T), (intra_dmat.view(-1, 3).T)).T
                 g = f - torch.floor(f + 0.5)
                 intra_dmat = torch.matmul(g, torch.Tensor(atomsobject.cell))
                 intra_dmat = intra_dmat.view(M, 3)
                 offsets = -torch.floor(f + 0.5).view(M, 3)
                 traj_unwrap = mol_xyz + torch.matmul(offsets, torch.Tensor(atomsobject.cell))
             else:
-                sub = (intra_dmat > 0.5 * box_len).to(torch.float) * box_len
-                add = (intra_dmat <= -0.5 * box_len).to(torch.float) * box_len
+                (intra_dmat > 0.5 * box_len).to(torch.float) * box_len
+                (intra_dmat <= -0.5 * box_len).to(torch.float) * box_len
                 shift = torch.round(torch.divide(intra_dmat, box_len))
                 offsets = -shift
                 traj_unwrap = mol_xyz + offsets * box_len
         else:
             traj_unwrap = mol_xyz
-        # traj_unwrap=mol_xyz+add-sub
         sys_xyz[idx] = traj_unwrap
 
     new_pos = sys_xyz.numpy()
 
     return new_pos
 
 
-# -
-
-
 class Attribution:
-    def __init__(self, ensemble: EnsembleNFF, save_file: str = None):
+    def __init__(self, ensemble: EnsembleNFF, save_file: Optional[str] = None):
         self.ensemble = ensemble
         self.save_file = save_file
 
@@ -197,17 +199,15 @@ def calc_attribution_file(
         step: int = 1,
         progress_bar: bool = True,
         to_chemiscope: bool = False,
-        bond_length: dict = None,
+        bond_length: Optional[dict] = None,
     ) -> list:
         attributions = []
         atoms_list = []
         energies = []
         energy_stds = []
         grads = []
         grad_stds = []
-        with tqdm(
-            range(skip, len(traj), step), disable=True if progress_bar == False else False
-        ) as pbar:  # , postfix={"fbest":"?",}) as pbar:
+        with tqdm(range(skip, len(traj), step), disable=not progress_bar) as pbar:  # , postfix={"fbest":"?",}) as pbar:
             # for i in range(skip,len(traj),step):
             for i in pbar:
                 # create atoms batch object
@@ -269,8 +269,7 @@ def calc_attribution_file(
                 },
             }
             return atoms_list, properties
-        else:
-            return attributions
+        return attributions
 
     def activelearning(
         self,
@@ -281,12 +280,10 @@ def activelearning(
         skip: int = 0,
         step: int = 1,
         progress_bar: bool = True,
-        bond_length: dict = None,
+        bond_length: Optional[dict] = None,
     ):
         atom_list = []
-        with tqdm(
-            range(skip, len(traj), step), disable=True if progress_bar == False else False
-        ) as pbar:  # , postfix={"fbest":"?",}) as pbar:
+        with tqdm(range(skip, len(traj), step), disable=not progress_bar) as pbar:  # , postfix={"fbest":"?",}) as pbar:
             # for i in range(skip,len(traj),step):
             for i in pbar:
                 # create atoms batch object
@@ -337,15 +334,15 @@ def activelearning(
                     neighs = np.append(neighs, a)
                     for n in neighs:
                         atomstocare = np.append(atomstocare, molecules[np.where(balanced_mols == n)[0][0]])
-                    atomstocare = np.array((list(set(atomstocare))))
+                    atomstocare = np.array(list(set(atomstocare)))
                     atomstocare = np.int64(atomstocare)
                     atoms1 = atoms[atomstocare]
                     index = np.where(atoms1.positions == atoms.positions[a])[0][0]
                     xyz = reconstruct_atoms(atoms1, [np.arange(0, len(atoms1))], centre=index)
                     atoms1.positions = xyz
                     is_repeated = False
-                    for Atoms in atom_list:
-                        if atoms1.__eq__(Atoms):
+                    for at in atom_list:
+                        if atoms1 == at:
                             is_repeated = True
                             break
                     if not is_repeated: