From 2f8e91f02c6a02fb4e789959883a96018c4039a9 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Fri, 4 Feb 2022 18:16:46 -0500 Subject: [PATCH 01/53] bump --- CHANGELOG.md | 2 +- nequip/_version.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 8ad45d6a..1cfbfa41 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -7,7 +7,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 Most recent change on the bottom. -## [Unreleased] +## [Unreleased] - 0.5.3 ## [0.5.2] - 2022-02-04 ### Added diff --git a/nequip/_version.py b/nequip/_version.py index 1d0ded98..e99ddf2f 100644 --- a/nequip/_version.py +++ b/nequip/_version.py @@ -2,4 +2,4 @@ # See Python packaging guide # https://packaging.python.org/guides/single-sourcing-package-version/ -__version__ = "0.5.2" +__version__ = "0.5.3" From 9cfa922dbaaebf9d5652cbfe204c430017365536 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Sat, 5 Feb 2022 13:00:58 -0500 Subject: [PATCH 02/53] better error msg --- nequip/scripts/evaluate.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/nequip/scripts/evaluate.py b/nequip/scripts/evaluate.py index a7d65397..0b5b198d 100644 --- a/nequip/scripts/evaluate.py +++ b/nequip/scripts/evaluate.py @@ -211,9 +211,7 @@ def main(args=None, running_as_script: bool = True): model.eval() # Load a config file - logger.info( - f"Loading {'original ' if dataset_is_from_training else ''}dataset...", - ) + logger.info(f"Loading {'original ' if dataset_is_from_training else ''}dataset...",) dataset_config = Config.from_file( str(args.dataset_config), defaults={"r_max": model_r_max} ) @@ -232,7 +230,10 @@ def main(args=None, running_as_script: bool = True): dataset = dataset_from_config(dataset_config, prefix="validation_dataset") dataset_is_validation = True except KeyError: + pass + if not dataset_is_validation: # Get shared train + validation dataset + # prefix `dataset` dataset = dataset_from_config(dataset_config) logger.info( f"Loaded {'validation_' if dataset_is_validation else ''}dataset specified in {args.dataset_config.name}.", From 9ec7fce481e9003dbc93902b56eefa277e2e22b8 Mon Sep 17 00:00:00 2001 From: nw13slx Date: Sat, 5 Feb 2022 15:09:03 -0500 Subject: [PATCH 03/53] move update to training script --- nequip/scripts/evaluate.py | 4 +++- nequip/scripts/train.py | 23 ++++++++++++++++++++++- nequip/train/trainer.py | 36 ++++++++++++++++++++---------------- 3 files changed, 45 insertions(+), 18 deletions(-) diff --git a/nequip/scripts/evaluate.py b/nequip/scripts/evaluate.py index 0b5b198d..22576b23 100644 --- a/nequip/scripts/evaluate.py +++ b/nequip/scripts/evaluate.py @@ -211,7 +211,9 @@ def main(args=None, running_as_script: bool = True): model.eval() # Load a config file - logger.info(f"Loading {'original ' if dataset_is_from_training else ''}dataset...",) + logger.info( + f"Loading {'original ' if dataset_is_from_training else ''}dataset...", + ) dataset_config = Config.from_file( str(args.dataset_config), defaults={"r_max": model_r_max} ) diff --git a/nequip/scripts/train.py b/nequip/scripts/train.py index d0aac2a7..77fee55f 100644 --- a/nequip/scripts/train.py +++ b/nequip/scripts/train.py @@ -15,11 +15,13 @@ import e3nn import e3nn.util.jit +import nequip from nequip.model import model_from_config from nequip.utils import Config, instantiate from nequip.data import dataset_from_config, register_fields -from 
nequip.utils.test import assert_AtomicData_equivariant, set_irreps_debug from nequip.utils import load_file, dtype_from_name +from nequip.utils.git import get_commit +from nequip.utils.test import assert_AtomicData_equivariant, set_irreps_debug from nequip.scripts._logger import set_up_script_logger default_config = dict( @@ -46,9 +48,24 @@ ) +def get_code_version(config): + for code in [e3nn, nequip, torch]: + config[f"{code.__name__}_version"] = code.__version__ + codes_for_git = {"e3nn", "nequip"} + for builder in config["model_builders"]: + if not isinstance(builder, str): + continue + builder = builder.split(".") + if len(builder) > 1: + # it's not a single name which is from nequip + codes_for_git.add(builder[0]) + config["code_versions"] = {code: get_commit(code) for code in codes_for_git} + + def main(args=None, running_as_script: bool = True): config = parse_command_line(args) + get_code_version(config) if running_as_script: set_up_script_logger(config.get("log", None), config.verbose) @@ -224,6 +241,8 @@ def restart(config): ) # compare dictionary to config and update stop condition related arguments + # note, "rainer.pth"/dictionary also store code versions, + # which will not be stored in cofig and thus not checked here for k in config.keys(): if config[k] != dictionary.get(k, ""): if k == "max_epochs": @@ -245,6 +264,8 @@ def restart(config): # dtype, etc. _set_global_options(config) + # note, the from_dict method will check whether the code version + # in trainer.pth is consistent and issue warnings if config.wandb: from nequip.train.trainer_wandb import TrainerWandB from nequip.utils.wandb import resume diff --git a/nequip/train/trainer.py b/nequip/train/trainer.py index 41b792fe..64fb6828 100644 --- a/nequip/train/trainer.py +++ b/nequip/train/trainer.py @@ -518,19 +518,6 @@ def as_dict( if hasattr(self, "config_save_path"): dictionary["progress"]["config_save_path"] = self.config_save_path - for code in [e3nn, nequip, torch]: - dictionary[f"{code.__name__}_version"] = code.__version__ - - codes_for_git = {"e3nn", "nequip"} - for builder in self.model_builders: - if not isinstance(builder, str): - continue - builder = builder.split(".") - if len(builder) > 1: - # it's not a single name which is from nequip - codes_for_git.add(builder[0]) - dictionary["code_versions"] = {code: get_commit(code) for code in codes_for_git} - return dictionary def save_config(self, blocking: bool = True) -> None: @@ -610,12 +597,29 @@ def from_dict(cls, dictionary, append: Optional[bool] = None): dictionary = deepcopy(dictionary) for code in [e3nn, nequip, torch]: - version = dictionary.get(f"{code.__name__}_version", None) - if version is not None and version != code.__version__: + commit = dictionary.get(f"{code.__name__}_version", None) + if commit is not None and commit != code.__version__: logging.warning( "Loading a pickled model created with different library version(s) may cause issues." 
f"current {code.__name__} verion: {code.__version__} " - f"vs original version: {version}" + f"vs original version: {commit}" + ) + codes_for_git = {"e3nn", "nequip"} + for builder in dictionary["model_builders"]: + if not isinstance(builder, str): + continue + builder = builder.split(".") + if len(builder) > 1: + # it's not a single name which is from nequip + codes_for_git.add(builder[0]) + for code in codes_for_git: + commit = (dictionary.get("code_versions", {})).get(code, None) + curr_commit = get_commit(code) + if commit is not None and commit != curr_commit: + logging.warning( + "Loading a pickled model created with different git version(s) may cause issues." + f"current {code}'s git commit: {curr_commit} " + f"vs original commit: {commit}" ) # update the restart and append option From 6bf3a473ab60fb2646dcc01a0cfb6ebe295a45d6 Mon Sep 17 00:00:00 2001 From: nw13slx Date: Sat, 5 Feb 2022 15:19:18 -0500 Subject: [PATCH 04/53] add sanity check to all scripts --- nequip/scripts/benchmark.py | 3 ++- nequip/scripts/deploy.py | 4 +++- nequip/scripts/evaluate.py | 14 +++++++------- nequip/scripts/train.py | 34 ++++++++++++++++++++++++++++++++-- 4 files changed, 44 insertions(+), 11 deletions(-) diff --git a/nequip/scripts/benchmark.py b/nequip/scripts/benchmark.py index 609b54c8..f0803ff0 100644 --- a/nequip/scripts/benchmark.py +++ b/nequip/scripts/benchmark.py @@ -15,7 +15,7 @@ from nequip.data import AtomicData, dataset_from_config from nequip.model import model_from_config from nequip.scripts.deploy import _compile_for_deploy -from nequip.scripts.train import _set_global_options, default_config +from nequip.scripts.train import _set_global_options, default_config, check_code_version def main(args=None): @@ -71,6 +71,7 @@ def main(args=None): config = Config.from_file(args.config, defaults=default_config) _set_global_options(config) + check_code_version(config) # Load dataset to get something to benchmark on print("Loading dataset... 
") diff --git a/nequip/scripts/deploy.py b/nequip/scripts/deploy.py index d9c91ce0..41aa45e3 100644 --- a/nequip/scripts/deploy.py +++ b/nequip/scripts/deploy.py @@ -20,7 +20,7 @@ from e3nn.util.jit import script -from nequip.scripts.train import _set_global_options +from nequip.scripts.train import _set_global_options, check_code_version from nequip.train import Trainer from nequip.utils import Config @@ -177,6 +177,8 @@ def main(args=None): config = Config.from_file(str(args.train_dir / "config.yaml")) _set_global_options(config) + check_code_version(config) + # -- load model -- model, _ = Trainer.load_model_from_training_session( args.train_dir, model_name="best_model.pth", device="cpu" diff --git a/nequip/scripts/evaluate.py b/nequip/scripts/evaluate.py index 22576b23..9604e77d 100644 --- a/nequip/scripts/evaluate.py +++ b/nequip/scripts/evaluate.py @@ -11,15 +11,12 @@ import torch -from nequip.utils import Config from nequip.data import AtomicData, Collater, dataset_from_config, register_fields -from nequip.train import Trainer from nequip.scripts.deploy import load_deployed_model, R_MAX_KEY -from nequip.scripts.train import default_config, _set_global_options -from nequip.utils import load_file, instantiate -from nequip.train.loss import Loss -from nequip.train.metrics import Metrics -from ._logger import set_up_script_logger +from nequip.scripts._logger import set_up_script_logger +from nequip.scripts.train import default_config, _set_global_options, check_code_version +from nequip.train import Trainer, Loss, Metrics +from nequip.utils import load_file, instantiate, Config ORIGINAL_DATASET_INDEX_KEY: str = "original_dataset_index" @@ -201,6 +198,9 @@ def main(args=None, running_as_script: bool = True): global_config = Config.from_file(str(global_config), defaults=default_config) _set_global_options(global_config) del global_config + + check_code_version(global_config) + # load a training session model model, model_config = Trainer.load_model_from_training_session( traindir=args.model.parent, model_name=args.model.name diff --git a/nequip/scripts/train.py b/nequip/scripts/train.py index 77fee55f..ab23e121 100644 --- a/nequip/scripts/train.py +++ b/nequip/scripts/train.py @@ -62,6 +62,34 @@ def get_code_version(config): config["code_versions"] = {code: get_commit(code) for code in codes_for_git} +def check_code_version(config): + for code in [e3nn, nequip, torch]: + commit = config.get(f"{code.__name__}_version", None) + if commit is not None and commit != code.__version__: + logging.warning( + "Loading a pickled model created with different library version(s) may cause issues." + f"current {code.__name__} verion: {code.__version__} " + f"vs original version: {commit}" + ) + codes_for_git = {"e3nn", "nequip"} + for builder in config["model_builders"]: + if not isinstance(builder, str): + continue + builder = builder.split(".") + if len(builder) > 1: + # it's not a single name which is from nequip + codes_for_git.add(builder[0]) + for code in codes_for_git: + commit = (config.get("code_versions", {})).get(code, None) + curr_commit = get_commit(code) + if commit is not None and commit != curr_commit: + logging.warning( + "Loading a pickled model created with different git version(s) may cause issues." 
+ f"current {code}'s git commit: {curr_commit} " + f"vs original commit: {commit}" + ) + + def main(args=None, running_as_script: bool = True): config = parse_command_line(args) @@ -241,8 +269,6 @@ def restart(config): ) # compare dictionary to config and update stop condition related arguments - # note, "rainer.pth"/dictionary also store code versions, - # which will not be stored in cofig and thus not checked here for k in config.keys(): if config[k] != dictionary.get(k, ""): if k == "max_epochs": @@ -256,6 +282,10 @@ def restart(config): f'Key "{k}" is different in config and the result trainer.pth file. Please double check' ) + # note, "trainer.pth"/dictionary also store code versions, + # which will not be stored in config and thus not checked here + check_code_version(config) + # recursive loop, if same type but different value # raise error From a8bdd0dae6e90da1db0c6599747e8a2c98540231 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Sun, 6 Feb 2022 14:32:40 -0500 Subject: [PATCH 05/53] refactoring --- nequip/scripts/train.py | 51 ++-------------------------------- nequip/utils/git.py | 6 ++-- nequip/utils/versions.py | 60 ++++++++++++++++++++++++++++++++++++++++ 3 files changed, 67 insertions(+), 50 deletions(-) create mode 100644 nequip/utils/versions.py diff --git a/nequip/scripts/train.py b/nequip/scripts/train.py index ab23e121..f67f77b2 100644 --- a/nequip/scripts/train.py +++ b/nequip/scripts/train.py @@ -15,13 +15,12 @@ import e3nn import e3nn.util.jit -import nequip from nequip.model import model_from_config from nequip.utils import Config, instantiate from nequip.data import dataset_from_config, register_fields from nequip.utils import load_file, dtype_from_name -from nequip.utils.git import get_commit from nequip.utils.test import assert_AtomicData_equivariant, set_irreps_debug +from nequip.utils.versions import check_code_version from nequip.scripts._logger import set_up_script_logger default_config = dict( @@ -48,52 +47,8 @@ ) -def get_code_version(config): - for code in [e3nn, nequip, torch]: - config[f"{code.__name__}_version"] = code.__version__ - codes_for_git = {"e3nn", "nequip"} - for builder in config["model_builders"]: - if not isinstance(builder, str): - continue - builder = builder.split(".") - if len(builder) > 1: - # it's not a single name which is from nequip - codes_for_git.add(builder[0]) - config["code_versions"] = {code: get_commit(code) for code in codes_for_git} - - -def check_code_version(config): - for code in [e3nn, nequip, torch]: - commit = config.get(f"{code.__name__}_version", None) - if commit is not None and commit != code.__version__: - logging.warning( - "Loading a pickled model created with different library version(s) may cause issues." - f"current {code.__name__} verion: {code.__version__} " - f"vs original version: {commit}" - ) - codes_for_git = {"e3nn", "nequip"} - for builder in config["model_builders"]: - if not isinstance(builder, str): - continue - builder = builder.split(".") - if len(builder) > 1: - # it's not a single name which is from nequip - codes_for_git.add(builder[0]) - for code in codes_for_git: - commit = (config.get("code_versions", {})).get(code, None) - curr_commit = get_commit(code) - if commit is not None and commit != curr_commit: - logging.warning( - "Loading a pickled model created with different git version(s) may cause issues." 
- f"current {code}'s git commit: {curr_commit} " - f"vs original commit: {commit}" - ) - - def main(args=None, running_as_script: bool = True): - config = parse_command_line(args) - get_code_version(config) if running_as_script: set_up_script_logger(config.get("log", None), config.verbose) @@ -180,7 +135,8 @@ def _set_global_options(config): def fresh_start(config): - + # we use add_to_config cause it's a fresh start and need to record it + check_code_version(config, add_to_config=True) _set_global_options(config) # = Make the trainer = @@ -259,7 +215,6 @@ def fresh_start(config): def restart(config): - # load the dictionary restart_file = f"{config.root}/{config.run_name}/trainer.pth" dictionary = load_file( diff --git a/nequip/utils/git.py b/nequip/utils/git.py index d58923f3..a78a87fc 100644 --- a/nequip/utils/git.py +++ b/nequip/utils/git.py @@ -1,9 +1,11 @@ +from typing import Optional + import subprocess from pathlib import Path from importlib import import_module -def get_commit(module: str): +def get_commit(module: str) -> Optional[str]: module = import_module(module) path = str(Path(module.__file__).parents[0] / "..") @@ -18,4 +20,4 @@ def get_commit(module: str): if retcode.returncode == 0: return retcode.stdout.decode().splitlines()[0].split()[0] else: - return "NaN" + return None diff --git a/nequip/utils/versions.py b/nequip/utils/versions.py new file mode 100644 index 00000000..7fb871c1 --- /dev/null +++ b/nequip/utils/versions.py @@ -0,0 +1,60 @@ +from typing import Tuple + +import logging + +import torch +import e3nn +import nequip + +from .git import get_commit + +_DEFAULT_VERSION_CODES = [torch, e3nn, nequip] +_DEFAULT_COMMIT_CODES = ["e3nn", "nequip"] + +_CODE_VERSIONS_KEY = "code_versions" +_CODE_COMMITS_KEY = "code_commits" + + +def _get_code_versions(config) -> Tuple[dict, dict]: + code_versions = {} + for code in _DEFAULT_VERSION_CODES: + code_versions[code.__name__] = code.__version__ + code_commits = set(_DEFAULT_COMMIT_CODES) + for builder in config["model_builders"]: + if not isinstance(builder, str): + continue + builder = builder.split(".") + if len(builder) > 1: + # it's not a single name which is from nequip + code_commits.add(builder[0]) + code_commits = {code: get_commit(code) for code in code_commits} + code_commits = {k: v for k, v in code_commits.items() if v is not None} + return code_versions, code_commits + + +def check_code_version(config, add_to_config: bool = False): + current_code_versions, current_code_commits = _get_code_versions(config) + + code_versions = config.get(_CODE_VERSIONS_KEY, {}) + for code, version in code_versions.items(): + # we use .get just in case we recorded something in an old version we don't in a new one + if version != current_code_versions.get(code, version): + logging.warning( + "Loading a saved model created with different library version(s) may cause issues." + f"current {code} version: {current_code_versions[code]} " + f"vs original version: {version}" + ) + + code_commits = config.get(_CODE_COMMITS_KEY, {}) + for code, commit in code_commits.items(): + # see why .get above + if commit != current_code_commits.get(code, commit): + logging.warning( + "Loading a saved model created with different library git commit(s) may cause issues." 
+ f"currently {code}'s git commit: {current_code_commits[code]} " + f"vs original commit: {commit}" + ) + + if add_to_config: + config[_CODE_VERSIONS_KEY] = current_code_versions + config[_CODE_COMMITS_KEY] = current_code_commits From 8e15034e45a2b42ef3234616aaeca2fdc06d7796 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Sun, 6 Feb 2022 14:33:39 -0500 Subject: [PATCH 06/53] remove duplication --- nequip/train/trainer.py | 31 ++----------------------------- 1 file changed, 2 insertions(+), 29 deletions(-) diff --git a/nequip/train/trainer.py b/nequip/train/trainer.py index 64fb6828..63288cdd 100644 --- a/nequip/train/trainer.py +++ b/nequip/train/trainer.py @@ -23,11 +23,9 @@ import contextlib2 as contextlib import numpy as np -import e3nn import torch from torch_ema import ExponentialMovingAverage -import nequip from nequip.data import DataLoader, AtomicData, AtomicDataDict, AtomicDataset from nequip.utils import ( Output, @@ -42,7 +40,7 @@ atomic_write_group, dtype_from_name, ) -from nequip.utils.git import get_commit +from nequip.utils.versions import check_code_version from nequip.model import model_from_config from .loss import Loss, LossStat @@ -595,32 +593,7 @@ def from_dict(cls, dictionary, append: Optional[bool] = None): """ dictionary = deepcopy(dictionary) - - for code in [e3nn, nequip, torch]: - commit = dictionary.get(f"{code.__name__}_version", None) - if commit is not None and commit != code.__version__: - logging.warning( - "Loading a pickled model created with different library version(s) may cause issues." - f"current {code.__name__} verion: {code.__version__} " - f"vs original version: {commit}" - ) - codes_for_git = {"e3nn", "nequip"} - for builder in dictionary["model_builders"]: - if not isinstance(builder, str): - continue - builder = builder.split(".") - if len(builder) > 1: - # it's not a single name which is from nequip - codes_for_git.add(builder[0]) - for code in codes_for_git: - commit = (dictionary.get("code_versions", {})).get(code, None) - curr_commit = get_commit(code) - if commit is not None and commit != curr_commit: - logging.warning( - "Loading a pickled model created with different git version(s) may cause issues." 
- f"current {code}'s git commit: {curr_commit} " - f"vs original commit: {commit}" - ) + check_code_version(dictionary) # update the restart and append option if append is not None: From 34be367dffa56fa1bb6127f57d3faa30b538952f Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Sun, 6 Feb 2022 15:10:46 -0500 Subject: [PATCH 07/53] use backward compatible style --- nequip/utils/versions.py | 28 ++++++++++++++++++++-------- 1 file changed, 20 insertions(+), 8 deletions(-) diff --git a/nequip/utils/versions.py b/nequip/utils/versions.py index 7fb871c1..fe751600 100644 --- a/nequip/utils/versions.py +++ b/nequip/utils/versions.py @@ -11,11 +11,23 @@ _DEFAULT_VERSION_CODES = [torch, e3nn, nequip] _DEFAULT_COMMIT_CODES = ["e3nn", "nequip"] -_CODE_VERSIONS_KEY = "code_versions" -_CODE_COMMITS_KEY = "code_commits" +CODE_COMMITS_KEY = "code_commits" -def _get_code_versions(config) -> Tuple[dict, dict]: +def get_config_code_versions(config) -> Tuple[dict, dict]: + code_versions = {} + for code in _DEFAULT_VERSION_CODES: + version = config.get(f"{code.__name__}_version", None) + if version is not None: + code_versions[code.__name__] = version + code_commits = config.get(CODE_COMMITS_KEY, {}) + if len(code_commits) == 0: + # look for the old style + code_commits = config.get("code_versions", {}) + return code_versions, code_commits + + +def get_current_code_versions(config) -> Tuple[dict, dict]: code_versions = {} for code in _DEFAULT_VERSION_CODES: code_versions[code.__name__] = code.__version__ @@ -33,9 +45,9 @@ def _get_code_versions(config) -> Tuple[dict, dict]: def check_code_version(config, add_to_config: bool = False): - current_code_versions, current_code_commits = _get_code_versions(config) + current_code_versions, current_code_commits = get_current_code_versions(config) + code_versions, code_commits = get_config_code_versions(config) - code_versions = config.get(_CODE_VERSIONS_KEY, {}) for code, version in code_versions.items(): # we use .get just in case we recorded something in an old version we don't in a new one if version != current_code_versions.get(code, version): @@ -45,7 +57,6 @@ def check_code_version(config, add_to_config: bool = False): f"vs original version: {version}" ) - code_commits = config.get(_CODE_COMMITS_KEY, {}) for code, commit in code_commits.items(): # see why .get above if commit != current_code_commits.get(code, commit): @@ -56,5 +67,6 @@ def check_code_version(config, add_to_config: bool = False): ) if add_to_config: - config[_CODE_VERSIONS_KEY] = current_code_versions - config[_CODE_COMMITS_KEY] = current_code_commits + for code, version in code_versions.items(): + config[f"{code}_version"] = version + config[CODE_COMMITS_KEY] = current_code_commits From 2bd39490aba4044880c530ddb58b0479731a7ca4 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Sun, 6 Feb 2022 15:13:45 -0500 Subject: [PATCH 08/53] save commit numbers --- nequip/scripts/deploy.py | 9 +++++++-- 1 file changed, 7 insertions(+), 2 deletions(-) diff --git a/nequip/scripts/deploy.py b/nequip/scripts/deploy.py index 41aa45e3..8348a8a9 100644 --- a/nequip/scripts/deploy.py +++ b/nequip/scripts/deploy.py @@ -20,14 +20,16 @@ from e3nn.util.jit import script -from nequip.scripts.train import _set_global_options, check_code_version +from nequip.scripts.train import _set_global_options from nequip.train import Trainer from nequip.utils import Config +from nequip.utils.versions import check_code_version, 
get_config_code_versions CONFIG_KEY: Final[str] = "config" NEQUIP_VERSION_KEY: Final[str] = "nequip_version" TORCH_VERSION_KEY: Final[str] = "torch_version" E3NN_VERSION_KEY: Final[str] = "e3nn_version" +CODE_COMMITS_KEY: Final[str] = "code_commits" R_MAX_KEY: Final[str] = "r_max" N_SPECIES_KEY: Final[str] = "n_species" TYPE_NAMES_KEY: Final[str] = "type_names" @@ -190,8 +192,11 @@ def main(args=None): # Deploy metadata: dict = {} + code_versions, code_commits = get_config_code_versions(config) for code in ["e3nn", "nequip", "torch"]: - metadata[code + "_version"] = config[code + "_version"] + metadata[code + "_version"] = code_versions[code] + if len(code_commits) > 0: + metadata[CODE_COMMITS_KEY] = code_commits metadata[R_MAX_KEY] = str(float(config["r_max"])) if "allowed_species" in config: From b24e47c8eebd2ee739cfe9da12452a943ed6cc62 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Sun, 6 Feb 2022 15:38:59 -0500 Subject: [PATCH 09/53] bugfixes --- nequip/scripts/deploy.py | 10 +++++++--- nequip/scripts/evaluate.py | 3 +-- nequip/utils/versions.py | 2 +- 3 files changed, 9 insertions(+), 6 deletions(-) diff --git a/nequip/scripts/deploy.py b/nequip/scripts/deploy.py index 8348a8a9..736de9a4 100644 --- a/nequip/scripts/deploy.py +++ b/nequip/scripts/deploy.py @@ -39,6 +39,8 @@ _ALL_METADATA_KEYS = [ CONFIG_KEY, NEQUIP_VERSION_KEY, + TORCH_VERSION_KEY, + E3NN_VERSION_KEY, R_MAX_KEY, N_SPECIES_KEY, TYPE_NAMES_KEY, @@ -193,10 +195,12 @@ def main(args=None): # Deploy metadata: dict = {} code_versions, code_commits = get_config_code_versions(config) - for code in ["e3nn", "nequip", "torch"]: - metadata[code + "_version"] = code_versions[code] + for code, version in code_versions.items(): + metadata[code + "_version"] = version if len(code_commits) > 0: - metadata[CODE_COMMITS_KEY] = code_commits + metadata[CODE_COMMITS_KEY] = ";".join( + f"{k}={v}" for k, v in code_commits.items() + ) metadata[R_MAX_KEY] = str(float(config["r_max"])) if "allowed_species" in config: diff --git a/nequip/scripts/evaluate.py b/nequip/scripts/evaluate.py index 9604e77d..c4e2db19 100644 --- a/nequip/scripts/evaluate.py +++ b/nequip/scripts/evaluate.py @@ -197,9 +197,8 @@ def main(args=None, running_as_script: bool = True): global_config = args.model.parent / "config.yaml" global_config = Config.from_file(str(global_config), defaults=default_config) _set_global_options(global_config) - del global_config - check_code_version(global_config) + del global_config # load a training session model model, model_config = Trainer.load_model_from_training_session( diff --git a/nequip/utils/versions.py b/nequip/utils/versions.py index fe751600..4401f3f0 100644 --- a/nequip/utils/versions.py +++ b/nequip/utils/versions.py @@ -67,6 +67,6 @@ def check_code_version(config, add_to_config: bool = False): ) if add_to_config: - for code, version in code_versions.items(): + for code, version in current_code_versions.items(): config[f"{code}_version"] = version config[CODE_COMMITS_KEY] = current_code_commits From 3351e34d49f0c3c61ce00dc059373c4bcd2f9349 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Sun, 6 Feb 2022 16:10:43 -0500 Subject: [PATCH 10/53] check p value for sanity --- nequip/nn/cutoffs.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/nequip/nn/cutoffs.py b/nequip/nn/cutoffs.py index 7deb7a7a..baf3801e 100644 --- a/nequip/nn/cutoffs.py +++ b/nequip/nn/cutoffs.py @@ -30,8 +30,9 @@ def 
__init__(self, r_max: float, p: float = 6): Power used in envelope function """ super().__init__() - self.p = p - self._factor = 1.0 / r_max + assert p > 0.0 + self.p = float(p) + self._factor = 1.0 / float(r_max) def forward(self, x): """ From 252882d7fc6c0b6df645152edecf03df7f5a01a0 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 8 Feb 2022 11:40:32 -0500 Subject: [PATCH 11/53] sane minimal p --- nequip/nn/cutoffs.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nequip/nn/cutoffs.py b/nequip/nn/cutoffs.py index baf3801e..ea79bfa1 100644 --- a/nequip/nn/cutoffs.py +++ b/nequip/nn/cutoffs.py @@ -30,7 +30,7 @@ def __init__(self, r_max: float, p: float = 6): Power used in envelope function """ super().__init__() - assert p > 0.0 + assert p >= 2.0 self.p = float(p) self._factor = 1.0 / float(r_max) From d174a296d11b06b3beec622a4cf97b2ab9eaa53d Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 8 Feb 2022 13:28:08 -0500 Subject: [PATCH 12/53] better error --- nequip/data/AtomicData.py | 22 +++++++++------------- 1 file changed, 9 insertions(+), 13 deletions(-) diff --git a/nequip/data/AtomicData.py b/nequip/data/AtomicData.py index bb23923e..4848b041 100644 --- a/nequip/data/AtomicData.py +++ b/nequip/data/AtomicData.py @@ -477,20 +477,16 @@ def to_ase( force = getattr(self, AtomicDataDict.FORCE_KEY, None) do_calc = energy is not None or force is not None + # exclude those that are special for ASE and that we process seperately + special_handling_keys = [ + AtomicDataDict.POSITIONS_KEY, + AtomicDataDict.CELL_KEY, + AtomicDataDict.PBC_KEY, + AtomicDataDict.ATOMIC_NUMBERS_KEY, + ] + AtomicDataDict.ALL_ENERGY_KEYS assert ( - len( - set(extra_fields).intersection( - [ # exclude those that are special for ASE and that we process seperately - AtomicDataDict.POSITIONS_KEY, - AtomicDataDict.CELL_KEY, - AtomicDataDict.PBC_KEY, - AtomicDataDict.ATOMIC_NUMBERS_KEY, - ] - + AtomicDataDict.ALL_ENERGY_KEYS - ) - ) - == 0 - ), "Cannot specify typical keys as `extra_fields` for atoms output" + len(set(extra_fields).intersection(special_handling_keys)) == 0 + ), f"Cannot specify keys handled in special ways ({special_handling_keys}) as `extra_fields` for atoms output--- they are output by default" if cell is not None: cell = cell.view(-1, 3, 3) From f4c6f03edb613d41ef2b241a762db28d6aac0cd6 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Wed, 9 Feb 2022 13:10:30 -0500 Subject: [PATCH 13/53] repeat option --- CHANGELOG.md | 2 ++ nequip/scripts/evaluate.py | 12 ++++++++++++ 2 files changed, 14 insertions(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 1cfbfa41..400c0dac 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -8,6 +8,8 @@ Most recent change on the bottom. ## [Unreleased] - 0.5.3 +### Added +- `nequip-evaluate --repeat` option ## [0.5.2] - 2022-02-04 ### Added diff --git a/nequip/scripts/evaluate.py b/nequip/scripts/evaluate.py index c4e2db19..1ee65721 100644 --- a/nequip/scripts/evaluate.py +++ b/nequip/scripts/evaluate.py @@ -77,6 +77,16 @@ def main(args=None, running_as_script: bool = True): type=int, default=50, ) + parser.add_argument( + "--repeat", + help=( + "Number of times to repeat evaluating the test dataset. " + "This can help compensate for CUDA nondeterminism, or can be used to evaluate error on models whose inference passes are intentionally nondeterministic. 
" + "Note that `--repeat`ed passes over the dataset will also be `--output`ed if an `--output` is specified." + ), + type=int, + default=1, + ) parser.add_argument( "--device", help="Device to run the model on. If not provided, defaults to CUDA if available and CPU otherwise.", @@ -286,6 +296,8 @@ def main(args=None, running_as_script: bool = True): logger.info( f"Using provided test set indexes, yielding a test set size of {len(test_idcs)} frames.", ) + test_idcs = torch.as_tensor(test_idcs, dtype=torch.long) + test_idcs = test_idcs.tile((args.repeat,)) # Figure out what metrics we're actually computing if do_metrics: From 7d111900ff18565a19ce84470e1d0f5c629aba30 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Mon, 14 Feb 2022 14:54:45 -0500 Subject: [PATCH 14/53] fix unbound variable bug --- nequip/scripts/evaluate.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nequip/scripts/evaluate.py b/nequip/scripts/evaluate.py index 1ee65721..72ea5c38 100644 --- a/nequip/scripts/evaluate.py +++ b/nequip/scripts/evaluate.py @@ -256,8 +256,8 @@ def main(args=None, running_as_script: bool = True): # this makes no sense if a dataset is given seperately if ( args.test_indexes is None - and train_idcs is not None and dataset_is_from_training + and train_idcs is not None ): # we know the train and val, get the rest all_idcs = set(range(len(dataset))) From b8d55fce1ca04c239f09e26aabf36590587d9dc3 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Mon, 14 Feb 2022 15:24:53 -0500 Subject: [PATCH 15/53] use_deterministic_algorithms --- CHANGELOG.md | 1 + nequip/scripts/train.py | 5 +++++ 2 files changed, 6 insertions(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 400c0dac..1a31fdcc 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -10,6 +10,7 @@ Most recent change on the bottom. ## [Unreleased] - 0.5.3 ### Added - `nequip-evaluate --repeat` option +- `torch_use_deterministic_algorithms` options ## [0.5.2] - 2022-02-04 ### Added diff --git a/nequip/scripts/train.py b/nequip/scripts/train.py index f67f77b2..c6384559 100644 --- a/nequip/scripts/train.py +++ b/nequip/scripts/train.py @@ -128,6 +128,11 @@ def _set_global_options(config): if config.grad_anomaly_mode: torch.autograd.set_detect_anomaly(True) + # this won't work for most of our models, but could be useful for computing metrics deterministically on CPU + use_det_algos = config.get("torch_use_deterministic_algorithms", False) + if use_det_algos: + torch.use_deterministic_algorithms(use_det_algos) + e3nn.set_optimization_defaults(**config.get("e3nn_optimization_defaults", {})) # Register fields: From c98c58b4b879c126aa2985f3e00927b1c77f1085 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Mon, 14 Feb 2022 15:27:52 -0500 Subject: [PATCH 16/53] Revert "use_deterministic_algorithms" This reverts commit b8d55fce1ca04c239f09e26aabf36590587d9dc3. --- CHANGELOG.md | 1 - nequip/scripts/train.py | 5 ----- 2 files changed, 6 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 1a31fdcc..400c0dac 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -10,7 +10,6 @@ Most recent change on the bottom. 
## [Unreleased] - 0.5.3 ### Added - `nequip-evaluate --repeat` option -- `torch_use_deterministic_algorithms` options ## [0.5.2] - 2022-02-04 ### Added diff --git a/nequip/scripts/train.py b/nequip/scripts/train.py index c6384559..f67f77b2 100644 --- a/nequip/scripts/train.py +++ b/nequip/scripts/train.py @@ -128,11 +128,6 @@ def _set_global_options(config): if config.grad_anomaly_mode: torch.autograd.set_detect_anomaly(True) - # this won't work for most of our models, but could be useful for computing metrics deterministically on CPU - use_det_algos = config.get("torch_use_deterministic_algorithms", False) - if use_det_algos: - torch.use_deterministic_algorithms(use_det_algos) - e3nn.set_optimization_defaults(**config.get("e3nn_optimization_defaults", {})) # Register fields: From 5c2d4f0ed25bd2d18a7f205066da869e3dd61002 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Mon, 14 Feb 2022 15:30:26 -0500 Subject: [PATCH 17/53] use_deterministic_algorithms in evaluate --- nequip/scripts/evaluate.py | 12 ++++++++++++ 1 file changed, 12 insertions(+) diff --git a/nequip/scripts/evaluate.py b/nequip/scripts/evaluate.py index 72ea5c38..329e1ec8 100644 --- a/nequip/scripts/evaluate.py +++ b/nequip/scripts/evaluate.py @@ -87,6 +87,12 @@ def main(args=None, running_as_script: bool = True): type=int, default=1, ) + parser.add_argument( + "--use-deterministic-algorithms", + help="Try to have PyTorch use deterministic algorithms. Will probably fail on GPU/CUDA.", + type=bool, + default=False, + ) parser.add_argument( "--device", help="Device to run the model on. If not provided, defaults to CUDA if available and CPU otherwise.", @@ -181,6 +187,12 @@ def main(args=None, running_as_script: bool = True): "WARNING: please note that models running on CUDA are usually nondeterministc and that this manifests in the final test errors; for a _more_ deterministic result, please use `--device cpu`", ) + if args.use_deterministic_algorithms: + logger.info( + "Telling PyTorch to try to use deterministic algorithms... please note that this will likely error on CUDA/GPU" + ) + torch.use_deterministic_algorithms(True) + # Load model: logger.info("Loading model... ") loaded_deployed_model: bool = False From f2859ddfd820e9f3bd5f637b85c1881ae0b9007d Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Mon, 14 Feb 2022 17:17:34 -0500 Subject: [PATCH 18/53] changed default for report_init_validation --- CHANGELOG.md | 3 +++ nequip/train/trainer.py | 2 +- 2 files changed, 4 insertions(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 400c0dac..5a9772f9 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -11,6 +11,9 @@ Most recent change on the bottom. 
### Added - `nequip-evaluate --repeat` option +### Changed +- default value for `report_init_validation` is now `True` + ## [0.5.2] - 2022-02-04 ### Added - Model builders may now process only the configuration diff --git a/nequip/train/trainer.py b/nequip/train/trainer.py index 63288cdd..5dcd557d 100644 --- a/nequip/train/trainer.py +++ b/nequip/train/trainer.py @@ -252,7 +252,7 @@ def __init__( log_epoch_freq: int = 1, save_checkpoint_freq: int = -1, save_ema_checkpoint_freq: int = -1, - report_init_validation: bool = False, + report_init_validation: bool = True, verbose="INFO", **kwargs, ): From 2ec3b37e248cc8b83f8b2602cc0d547685d2e8d9 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 15 Feb 2022 11:05:05 -0500 Subject: [PATCH 19/53] show type names in info output --- nequip/data/transforms.py | 19 +++++++++++++++++++ nequip/model/_scaling.py | 5 ++++- 2 files changed, 23 insertions(+), 1 deletion(-) diff --git a/nequip/data/transforms.py b/nequip/data/transforms.py index 68ad6bcc..90c0c588 100644 --- a/nequip/data/transforms.py +++ b/nequip/data/transforms.py @@ -130,3 +130,22 @@ def untransform(self, atom_types): @property def has_chemical_symbols(self) -> bool: return self.chemical_symbol_to_type is not None + + @staticmethod + def format( + data: list, type_names: List[str], element_formatter: str = ".6f" + ) -> str: + data = torch.as_tensor(data) + if data.ndim == 0: + return (f"[{', '.join(type_names)}: {{:{element_formatter}}}]").format(data) + elif data.ndim == 1 and len(data) == len(type_names): + return ( + "[" + + ", ".join( + f"{{{i}[0]}}: {{{i}[1]:{element_formatter}}}" + for i in range(len(data)) + ) + + "]" + ).format(*zip(type_names, data)) + else: + raise ValueError diff --git a/nequip/model/_scaling.py b/nequip/model/_scaling.py index bcd31e1e..3c3a95df 100644 --- a/nequip/model/_scaling.py +++ b/nequip/model/_scaling.py @@ -5,6 +5,7 @@ from nequip.nn import RescaleOutput, GraphModuleMixin, PerSpeciesScaleShift from nequip.data import AtomicDataDict, AtomicDataset +from nequip.data.transforms import TypeMapper RESCALE_THRESHOLD = 1e-6 @@ -242,7 +243,9 @@ def PerSpeciesRescale( params=params, ) - logging.info(f"Atomic outputs are scaled by: {scales}, shifted by {shifts}.") + logging.info( + f"Atomic outputs are scaled by: {TypeMapper.format(scales, config.type_names)}, shifted by {TypeMapper.format(shifts, config.type_names)}." 
+ ) # == Build the model == return model From 42b5522c5a76edc518993ac0fd140146d2d8e92c Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 15 Feb 2022 11:15:37 -0500 Subject: [PATCH 20/53] print with type names in debug perspecies --- nequip/nn/_atomwise.py | 11 ++++++++--- 1 file changed, 8 insertions(+), 3 deletions(-) diff --git a/nequip/nn/_atomwise.py b/nequip/nn/_atomwise.py index a4a1dba1..db65ac0c 100644 --- a/nequip/nn/_atomwise.py +++ b/nequip/nn/_atomwise.py @@ -8,6 +8,7 @@ from e3nn.o3 import Linear from nequip.data import AtomicDataDict +from nequip.data.transforms import TypeMapper from ._graph_mixin import GraphModuleMixin @@ -109,6 +110,7 @@ def __init__( self, field: str, num_types: int, + type_names: List[str], shifts: Optional[List[float]], scales: Optional[List[float]], arguments_in_dataset_units: bool, @@ -119,6 +121,7 @@ def __init__( ): super().__init__() self.num_types = num_types + self.type_names = type_names self.field = field self.out_field = f"shifted_{field}" if out_field is None else out_field self._init_irreps( @@ -176,8 +179,9 @@ def update_for_rescale(self, rescale_module): return if self.arguments_in_dataset_units and rescale_module.has_scale: logging.debug( - f"PerSpeciesScaleShift's arguments were in dataset units; rescaling:\n" - f"Original scales {self.scales if self.has_scales else 'n/a'} shifts: {self.shifts if self.has_shifts else 'n/a'}" + f"PerSpeciesScaleShift's arguments were in dataset units; rescaling:\n " + f"Original scales: {TypeMapper.format(self.scales, self.type_names) if self.has_scales else 'n/a'} " + f"shifts: {TypeMapper.format(self.shifts, self.type_names) if self.has_shifts else 'n/a'}" ) with torch.no_grad(): if self.has_scales: @@ -185,5 +189,6 @@ def update_for_rescale(self, rescale_module): if self.has_shifts: self.shifts.div_(rescale_module.scale_by) logging.debug( - f"New scales {self.scales if self.has_scales else 'n/a'} shifts: {self.shifts if self.has_shifts else 'n/a'}" + f" New scales: {TypeMapper.format(self.scales, self.type_names) if self.has_scales else 'n/a'} " + f"shifts: {TypeMapper.format(self.shifts, self.type_names) if self.has_shifts else 'n/a'}" ) From b56517b42b04e7506f07f0ba8523c7fe17a268b8 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 15 Feb 2022 11:38:23 -0500 Subject: [PATCH 21/53] type names in per species loss --- nequip/scripts/evaluate.py | 8 ++++++-- nequip/train/trainer.py | 9 ++------- 2 files changed, 8 insertions(+), 9 deletions(-) diff --git a/nequip/scripts/evaluate.py b/nequip/scripts/evaluate.py index 329e1ec8..12c521c6 100644 --- a/nequip/scripts/evaluate.py +++ b/nequip/scripts/evaluate.py @@ -401,7 +401,8 @@ def main(args=None, running_as_script: bool = True): " | ".join( f"{k} = {v:4.4f}" for k, v in metrics.flatten_metrics( - metrics.current_result() + metrics.current_result(), + type_names=dataset.type_mapper.type_names, )[0].items() ) ) @@ -418,7 +419,10 @@ def main(args=None, running_as_script: bool = True): logger.critical( "\n".join( f"{k:>20s} = {v:< 20f}" - for k, v in metrics.flatten_metrics(metrics.current_result())[0].items() + for k, v in metrics.flatten_metrics( + metrics.current_result(), + type_names=dataset.type_mapper.type_names, + )[0].items() ) ) diff --git a/nequip/train/trainer.py b/nequip/train/trainer.py index 5dcd557d..f7a9b3e4 100644 --- a/nequip/train/trainer.py +++ b/nequip/train/trainer.py @@ -943,10 +943,7 @@ def end_of_batch_log(self, 
batch_type: str): # append details from metrics metrics, skip_keys = self.metrics.flatten_metrics( metrics=self.batch_metrics, - # TO DO, how about chemical to symbol - type_names=self.model.config.get("type_names") - if hasattr(self.model, "config") - else None, + type_names=self.dataset_train.type_mapper.type_names, ) for key, value in metrics.items(): @@ -1067,9 +1064,7 @@ def end_of_epoch_log(self): met, skip_keys = self.metrics.flatten_metrics( metrics=self.metrics_dict[category], - type_names=self.model.config.get("type_names") - if hasattr(self.model, "config") - else None, + type_names=self.dataset_train.type_mapper.type_names, ) # append details from loss From 9bc4b6f1a21f3487adab58876f0845b761baf2b6 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 15 Feb 2022 11:49:51 -0500 Subject: [PATCH 22/53] fix test --- tests/unit/nn/test_atomic.py | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/unit/nn/test_atomic.py b/tests/unit/nn/test_atomic.py index 3b00f7ae..e2897248 100644 --- a/tests/unit/nn/test_atomic.py +++ b/tests/unit/nn/test_atomic.py @@ -21,6 +21,7 @@ def model(float_tolerance, request): shifts[zero_species] = 0 params = dict( num_types=3, + type_names=["A", "B", "C"], total_shift=1.0, shifts=shifts, ) From 693190bd78f2a68f56f0f34fd78eb0de5dc5d8d7 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Wed, 16 Feb 2022 12:06:35 -0500 Subject: [PATCH 23/53] warn on both global and local shift --- nequip/model/_scaling.py | 23 +++++++++++++++++++++-- 1 file changed, 21 insertions(+), 2 deletions(-) diff --git a/nequip/model/_scaling.py b/nequip/model/_scaling.py index 3c3a95df..1fd42815 100644 --- a/nequip/model/_scaling.py +++ b/nequip/model/_scaling.py @@ -14,6 +14,25 @@ def RescaleEnergyEtc( model: GraphModuleMixin, config, dataset: AtomicDataset, initialize: bool ): + # Check for common double shift mistake with defaults + if "PerSpeciesRescale" in config.get("model_builders", []): + # if the defaults are enabled, then we will get bad double shift + # THIS CHECK IS ONLY GOOD ENOUGH FOR EMITTING WARNINGS + has_global_shift = config.get("global_rescale_shift", None) is not None + k = "per_species_rescale_shifts" + if has_global_shift: + if k not in config: + # using default of per_atom shift + raise RuntimeError( + "A global_rescale_shift was provided, but the default per-atom energy shift was not disabled." + ) + else: + if config[k] is not None: + logging.warn( + "A global shift was enabled, but a per-species shift was _also_ enabled. Please make sure this is what you meant!" + ) + + del has_global_shift, k return GlobalRescale( model=model, @@ -56,7 +75,7 @@ def GlobalRescale( if global_shift is not None: logging.warning( f"!!!! Careful global_shift is set to {global_shift}." - f"The energy model will no longer be extensive" + f"The model for {default_shift_keys} will no longer be size extensive" ) # = Get statistics of training dataset = @@ -96,7 +115,7 @@ def GlobalRescale( f"Global energy scaling was very low: {global_scale}. If dataset values were used, does the dataset contain insufficient variation? Maybe try disabling global scaling with global_scale=None." ) - logging.debug( + logging.info( f"Initially outputs are globally scaled by: {global_scale}, total_energy are globally shifted by {global_shift}." 
) From 35d8b18df2215e662f770651bb63bc9e7d5ebc07 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Wed, 16 Feb 2022 13:17:20 -0500 Subject: [PATCH 24/53] allow printing none --- nequip/data/transforms.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/nequip/data/transforms.py b/nequip/data/transforms.py index 90c0c588..b5c77a32 100644 --- a/nequip/data/transforms.py +++ b/nequip/data/transforms.py @@ -135,8 +135,10 @@ def has_chemical_symbols(self) -> bool: def format( data: list, type_names: List[str], element_formatter: str = ".6f" ) -> str: - data = torch.as_tensor(data) - if data.ndim == 0: + data = torch.as_tensor(data) if data is not None else None + if data is None: + return f"[{', '.join(type_names)}: None]" + elif data.ndim == 0: return (f"[{', '.join(type_names)}: {{:{element_formatter}}}]").format(data) elif data.ndim == 1 and len(data) == len(type_names): return ( From 6c6bff2a61c81733c843332ce033256fb15af1c5 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Wed, 16 Feb 2022 13:17:43 -0500 Subject: [PATCH 25/53] move check to per species --- nequip/model/_scaling.py | 33 +++++++++++++-------------------- 1 file changed, 13 insertions(+), 20 deletions(-) diff --git a/nequip/model/_scaling.py b/nequip/model/_scaling.py index 1fd42815..dba8aa35 100644 --- a/nequip/model/_scaling.py +++ b/nequip/model/_scaling.py @@ -14,26 +14,6 @@ def RescaleEnergyEtc( model: GraphModuleMixin, config, dataset: AtomicDataset, initialize: bool ): - # Check for common double shift mistake with defaults - if "PerSpeciesRescale" in config.get("model_builders", []): - # if the defaults are enabled, then we will get bad double shift - # THIS CHECK IS ONLY GOOD ENOUGH FOR EMITTING WARNINGS - has_global_shift = config.get("global_rescale_shift", None) is not None - k = "per_species_rescale_shifts" - if has_global_shift: - if k not in config: - # using default of per_atom shift - raise RuntimeError( - "A global_rescale_shift was provided, but the default per-atom energy shift was not disabled." - ) - else: - if config[k] is not None: - logging.warn( - "A global shift was enabled, but a per-species shift was _also_ enabled. Please make sure this is what you meant!" - ) - - del has_global_shift, k - return GlobalRescale( model=model, config=config, @@ -173,6 +153,19 @@ def PerSpeciesRescale( f"dataset_per_atom_{AtomicDataDict.TOTAL_ENERGY_KEY}_mean", ) + # Check for common double shift mistake with defaults + if "RescaleEnergyEtc" in config.get("model_builders", []): + # if the defaults are enabled, then we will get bad double shift + # THIS CHECK IS ONLY GOOD ENOUGH FOR EMITTING WARNINGS + has_global_shift = config.get("global_rescale_shift", None) is not None + if has_global_shift: + if shifts is not None: + # using default of per_atom shift + raise RuntimeError( + "A global_rescale_shift was provided, but the default per-atom energy shift was not disabled." 
+ ) + del has_global_shift + # = Determine what statistics need to be compute =\ arguments_in_dataset_units = None if initialize: From 8b4f3df6006d23b7fdc1b84a9307eeba45fecfa1 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Wed, 16 Feb 2022 13:19:56 -0500 Subject: [PATCH 26/53] changelog --- CHANGELOG.md | 3 +++ 1 file changed, 3 insertions(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 5a9772f9..4f230cbc 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -14,6 +14,9 @@ Most recent change on the bottom. ### Changed - default value for `report_init_validation` is now `True` +### Fixed +- error if both per-species and global shift are used together + ## [0.5.2] - 2022-02-04 ### Added - Model builders may now process only the configuration From 882fd22041f9975151576780d48695449b3d7c68 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Fri, 18 Feb 2022 14:45:24 -0500 Subject: [PATCH 27/53] test forces on calculator too --- tests/integration/test_deploy.py | 35 +++++++++++++++++++++++--------- 1 file changed, 25 insertions(+), 10 deletions(-) diff --git a/tests/integration/test_deploy.py b/tests/integration/test_deploy.py index e132e413..2d42ba2a 100644 --- a/tests/integration/test_deploy.py +++ b/tests/integration/test_deploy.py @@ -20,11 +20,14 @@ ) def test_deploy(nequip_dataset, BENCHMARK_ROOT, device): dtype = str(torch.get_default_dtype())[len("torch.") :] + atol = {"float32": 1e-5, "float64": 1e-7}[dtype] # if torch.cuda.is_available(): # # TODO: is this true? # pytest.skip("CUDA and subprocesses have issues") + keys = [AtomicDataDict.TOTAL_ENERGY_KEY, AtomicDataDict.FORCE_KEY] + config_path = pathlib.Path(__file__).parents[2] / "configs/minimal.yaml" true_config = yaml.load(config_path.read_text(), Loader=yaml.Loader) with tempfile.TemporaryDirectory() as tmpdir: @@ -65,11 +68,10 @@ def test_deploy(nequip_dataset, BENCHMARK_ROOT, device): best_mod.eval() data = AtomicData.to_AtomicDataDict(nequip_dataset[0].to(device)) - # Needed because of debug mode: - data[AtomicDataDict.TOTAL_ENERGY_KEY] = data[ - AtomicDataDict.TOTAL_ENERGY_KEY - ].unsqueeze(0) - train_pred = best_mod(data)[AtomicDataDict.TOTAL_ENERGY_KEY].to("cpu") + for k in keys: + data.pop(k) + train_pred = best_mod(data) + train_pred = {k: train_pred[k].to("cpu") for k in keys} # load model and check that metadata saved # TODO: use both CPU and CUDA to load? 
@@ -85,8 +87,12 @@ def test_deploy(nequip_dataset, BENCHMARK_ROOT, device): data_idx = 0 data = AtomicData.to_AtomicDataDict(nequip_dataset[data_idx].to("cpu")) - deploy_pred = deploy_mod(data)[AtomicDataDict.TOTAL_ENERGY_KEY] - assert torch.allclose(train_pred, deploy_pred, atol=1e-7) + for k in keys: + data.pop(k) + deploy_pred = deploy_mod(data) + deploy_pred = {k: deploy_pred[k].to("cpu") for k in keys} + for k in keys: + assert torch.allclose(train_pred[k], deploy_pred[k], atol=atol) # now test info # hack for old version @@ -109,9 +115,18 @@ def test_deploy(nequip_dataset, BENCHMARK_ROOT, device): deployed_path, device="cpu", species_to_type_name={s: s for s in ("C", "H", "O")}, + set_global_options=False, ) # use .get() so it's not transformed - atoms = nequip_dataset.get(data_idx).to_ase() + atoms = nequip_dataset.get(nequip_dataset.indices()[data_idx]).to_ase() atoms.calc = calc - ase_forces = atoms.get_potential_energy() - assert torch.allclose(train_pred, torch.as_tensor(ase_forces), atol=1e-7) + ase_pred = { + AtomicDataDict.TOTAL_ENERGY_KEY: atoms.get_potential_energy(), + AtomicDataDict.FORCE_KEY: atoms.get_forces(), + } + for k in keys: + assert torch.allclose( + deploy_pred[k], + torch.as_tensor(ase_pred[k], dtype=torch.get_default_dtype()), + atol=atol, + ) From 02d256ef6a723e775d7371f85053b96438e331ea Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Fri, 18 Feb 2022 14:45:31 -0500 Subject: [PATCH 28/53] numpy for total energy (dtype consistancy) --- nequip/ase/nequip_calculator.py | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/nequip/ase/nequip_calculator.py b/nequip/ase/nequip_calculator.py index 11b7f54a..ef14e196 100644 --- a/nequip/ase/nequip_calculator.py +++ b/nequip/ase/nequip_calculator.py @@ -103,14 +103,17 @@ def calculate(self, atoms=None, properties=["energy"], system_changes=all_change # prepare data data = AtomicData.from_ase(atoms=atoms, r_max=self.r_max) + for k in AtomicDataDict.ALL_ENERGY_KEYS: + if k in data: + del data[k] data = self.transform(data) - data = data.to(self.device) + data = AtomicData.to_AtomicDataDict(data) # predict + extract data - out = self.model(AtomicData.to_AtomicDataDict(data)) + out = self.model(data) forces = out[AtomicDataDict.FORCE_KEY].detach().cpu().numpy() - energy = out[AtomicDataDict.TOTAL_ENERGY_KEY].detach().cpu().item() + energy = out[AtomicDataDict.TOTAL_ENERGY_KEY].detach().cpu().numpy() # store results self.results = { From 84855472a71214cc46ca1bef11dfce6ab6b78bf2 Mon Sep 17 00:00:00 2001 From: Simon Batzner Date: Sat, 19 Feb 2022 10:40:44 -0500 Subject: [PATCH 29/53] Updated example.yaml + full.yaml with better defaults + comments --- CHANGELOG.md | 4 ++ configs/example.yaml | 54 +++++++++++++++---------- configs/full.yaml | 95 +++++++++++++++++++++++++------------------- 3 files changed, 92 insertions(+), 61 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 400c0dac..18243229 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -11,6 +11,10 @@ Most recent change on the bottom. 
### Added - `nequip-evaluate --repeat` option +### Changed +- defaults and commments in example.yaml and full.yaml, in particular longer default training and correct comment for E:F-weighting +- better metrics config in example.yaml and full.yaml, in particular will total F-MAE/F-RMSE instead of mean over per-species + ## [0.5.2] - 2022-02-04 ### Added - Model builders may now process only the configuration diff --git a/configs/example.yaml b/configs/example.yaml index 51bf5a3c..84d1816a 100644 --- a/configs/example.yaml +++ b/configs/example.yaml @@ -6,22 +6,23 @@ # if 'root'/'run_name' exists, 'root'/'run_name'_'year'-'month'-'day'-'hour'-'min'-'s' will be used instead. root: results/toluene run_name: example-run-toluene -seed: 123 -dataset_seed: 456 # random number seed for numpy and torch +seed: 123 # model seed +dataset_seed: 456 # data set seed append: true # set true if a restarted run should append to the previous log file default_dtype: float32 # type of float to use, e.g. float32 and float64 # network r_max: 4.0 # cutoff radius in length units, here Angstrom, this is an important hyperparamter to scan -num_layers: 4 # number of interaction blocks, we find 4-6 to work best -l_max: 1 # the maximum irrep order (rotation order) for the network's features -parity: true # whether to include features with odd mirror parity +num_layers: 4 # number of interaction blocks, we find 3-5 to work best +l_max: 1 # the maximum irrep order (rotation order) for the network's features, l=1 is a good default, l=2 is more accurate but slower +parity: true # whether to include features with odd mirror parity; often turning parity off gives equally good results but faster networks, so do consider this num_features: 32 # the multiplicity of the features nonlinearity_type: gate # may be 'gate' or 'norm', 'gate' is recommended # scalar nonlinearities to use — available options are silu, ssp (shifted softplus), tanh, and abs. # Different nonlinearities are specified for e (even) and o (odd) parity; -# note that only tanh and abs are correct for o (odd parity). +# note that only tanh and abs are correct for o (odd parity) +# silu typically works best nonlinearity_scalars: e: silu o: tanh @@ -31,14 +32,14 @@ nonlinearity_gates: o: tanh # radial network basis -num_basis: 8 # number of basis functions used in the radial basis +num_basis: 8 # number of basis functions used in the radial basis, 8 usually works best BesselBasis_trainable: true # set true to train the bessel weights -PolynomialCutoff_p: 6 # p-exponent used in polynomial cutoff function +PolynomialCutoff_p: 6 # p-exponent used in polynomial cutoff function, smaller p corresponds to stronger decay with distance # radial network invariant_layers: 2 # number of radial layers, usually 1-3 works best, smaller is faster invariant_neurons: 64 # number of hidden neurons in radial function, smaller is faster -avg_num_neighbors: auto # number of neighbors to divide by, null => no normalization. +avg_num_neighbors: auto # number of neighbors to divide by, null => no normalization, auto computes it based on dataset use_sc: true # use self-connection or not, usually gives big improvement # data set @@ -63,11 +64,11 @@ chemical_symbols: - C # logging -wandb: true # we recommend using wandb for logging, we'll turn it off here as it's optional +wandb: true # we recommend using wandb for logging wandb_project: toluene-example # project name used in wandb -verbose: info # the same as python logging, e.g. warning, info, debug, error. 
case insensitive -log_batch_freq: 1000000 # batch frequency, how often to print training errors withinin the same epoch +verbose: info # the same as python logging, e.g. warning, info, debug, error; case insensitive +log_batch_freq: 10 # batch frequency, how often to print training errors withinin the same epoch log_epoch_freq: 1 # epoch frequency, how often to print and save the model save_checkpoint_freq: -1 # frequency to save the intermediate checkpoint. no saving when the value is not positive. save_ema_checkpoint_freq: -1 # frequency to save the intermediate ema checkpoint. no saving when the value is not positive. @@ -77,39 +78,50 @@ n_train: 100 n_val: 50 # number of validation data learning_rate: 0.005 # learning rate, we found values between 0.01 and 0.005 to work best - this is often one of the most important hyperparameters to tune batch_size: 5 # batch size, we found it important to keep this small for most applications including forces (1-5); for energy-only training, higher batch sizes work better -max_epochs: 100 # stop training after _ number of epochs, we set a very large number here, it won't take this long in practice and we will use early stopping instead +max_epochs: 100000 # stop training after _ number of epochs, we set a very large number here, it won't take this long in practice and we will use early stopping instead train_val_split: random # can be random or sequential. if sequential, first n_train elements are training, next n_val are val, else random, usually random is the right choice -shuffle: true # If true, the data loader will shuffle the data, usually a good idea +shuffle: true # if true, the data loader will shuffle the data, usually a good idea metrics_key: validation_loss # metrics used for scheduling and saving best model. Options: `set`_`quantity`, set can be either "train" or "validation, "quantity" can be loss or anything that appears in the validation batch step header, such as f_mae, f_rmse, e_mae, e_rmse use_ema: true # if true, use exponential moving average on weights for val/test, usually helps a lot with training, in particular for energy errors ema_decay: 0.99 # ema weight, typically set to 0.99 or 0.999 ema_use_num_updates: true # whether to use number of updates when computing averages +report_init_validation: true # if True, report the validation error for just initialized model # early stopping based on metrics values. early_stopping_patiences: # stop early if a metric value stopped decreasing for n epochs validation_loss: 50 # loss function -loss_coeffs: # different weights to use in a weighted loss functions - forces: 1 # for MD applications, we recommed a force weight of 100 and an energy weight of 1 - total_energy: # alternatively, if energies are not of importance, a force weight 1 and an energy weight of 0 also works. +loss_coeffs: + forces: 1 # if using PerAtomMSELoss, a default weight of 1:1 on each should work well + total_energy: - 1 - PerAtomMSELoss # output metrics metrics_components: + - - forces # key + - mae # "rmse" or "mae" + - - forces + - rmse - - forces - mae - - PerSpecies: True - report_per_component: False + - PerSpecies: True # if true, per species contribution is counted separately + report_per_component: False # if true, statistics on each component (i.e. 
fx, fy, fz) will be counted separately + - - forces + - rmse + - PerSpecies: True + report_per_component: False + - - total_energy + - mae - - total_energy - mae - PerAtom: True # if true, energy is normalized by the number of atoms # optimizer, may be any optimizer defined in torch.optim # the name `optimizer_name`is case sensitive -optimizer_name: Adam # default optimizer is Adam in the amsgrad mode -optimizer_amsgrad: true +optimizer_name: Adam # default optimizer is Adam +optimizer_amsgrad: false # lr scheduler, currently only supports the two options listed below, if you need more please file an issue # first: on-plateau, reduce lr by factory of lr_scheduler_factor if metrics_key hasn't improved for lr_scheduler_patience epoch diff --git a/configs/full.yaml b/configs/full.yaml index 40544438..42a2eab9 100644 --- a/configs/full.yaml +++ b/configs/full.yaml @@ -2,7 +2,7 @@ # This is a full yaml file with all nequip options. # It is primarily intented to serve as documentation/reference for all options -# For a simpler yaml file containing all necessary feature to get you started check out configs/example.yaml +# For a simpler yaml file containing all necessary features to get you started, we stronlgy recommend to start with configs/example.yaml # Two folders will be used during the training: 'root'/process and 'root'/'run_name' # run_name contains logfiles and saved models @@ -10,19 +10,19 @@ # if 'root'/'run_name' exists, 'root'/'run_name'_'year'-'month'-'day'-'hour'-'min'-'s' will be used instead. root: results/toluene run_name: example-run-toluene -seed: 123 -dataset_seed: 456 # random number seed for numpy and torch +seed: 123 # model seed +dataset_seed: 456 # data set seed append: true # set true if a restarted run should append to the previous log file default_dtype: float32 # type of float to use, e.g. float32 and float64 allow_tf32: false # whether to use TensorFloat32 if it is available -# device: cuda # which device to use. Default: automatically detected cuda or "cpu" +# device: cuda # which device to use. 
Default: automatically detected cuda or "cpu" # network r_max: 4.0 # cutoff radius in length units, here Angstrom, this is an important hyperparamter to scan -num_layers: 4 # number of interaction blocks, we find 4-6 to work best +num_layers: 4 # number of interaction blocks, we find 3-5 to work best -l_max: 1 # the maximum irrep order (rotation order) for the network's features -parity: true # whether to include features with odd mirror parity +l_max: 1 # the maximum irrep order (rotation order) for the network's features, l=1 is a good default, l=2 is more accurate but slower +parity: true # whether to include features with odd mirror parityy; often turning parity off gives equally good results but faster networks, so do consider this num_features: 32 # the multiplicity of the features # alternatively, the irreps of the features in various parts of the network can be specified directly: @@ -50,14 +50,14 @@ nonlinearity_gates: o: tanh # radial network basis -num_basis: 8 # number of basis functions used in the radial basis +num_basis: 8 # number of basis functions used in the radial basis, 8 usually works best BesselBasis_trainable: true # set true to train the bessel weights -PolynomialCutoff_p: 6 # p-exponent used in polynomial cutoff function +PolynomialCutoff_p: 6 # p-exponent used in polynomial cutoff function, smaller p corresponds to stronger decay with distance # radial network invariant_layers: 2 # number of radial layers, usually 1-3 works best, smaller is faster invariant_neurons: 64 # number of hidden neurons in radial function, smaller is faster -avg_num_neighbors: auto # number of neighbors to divide by, null => no normalization. +avg_num_neighbors: auto # number of neighbors to divide by, null => no normalization, auto computes it based on dataset use_sc: true # use self-connection or not, usually gives big improvement # to specify different parameters for each convolutional layer, try examples below @@ -66,20 +66,10 @@ use_sc: true # invariant_neurons < InteractionBlock_invariant_neurons < layer{i}_invariant_neurons # data set -# the keys used need to be stated at least once in key_mapping, npz_fixed_field_keys or include_keys -# key_mapping is used to map the key in the npz file to the NequIP default values (see data/_key.py) -# all arrays are expected to have the shape of (nframe, natom, ?) except the fixed fields -# note that if your data set uses pbc, you need to also pass an array that maps to the nequip "pbc" key -dataset: npz # type of data set, can be npz or ase -dataset_url: http://quantum-machine.org/gdml/data/npz/toluene_ccsd_t.zip # url to download the npz. 
optional -dataset_file_name: ./benchmark_data/toluene_ccsd_t-train.npz # path to data set file -key_mapping: - z: atomic_numbers # atomic species, integers - E: total_energy # total potential eneriges to train to - F: forces # atomic forces to train to - R: pos # raw atomic positions -npz_fixed_field_keys: # fields that are repeated across different examples - - atomic_numbers +# there are two options to specify a dataset, npz or ase +# npz works with npz files, ase can ready any format that ase.io.read can read +# in most cases working with the ase option and an extxyz file is by far the simplest way to do it and we strongly recommend using this +# simply provide a single extxyz file that contains the structures together with energies and forces (generated with ase.io.write(atoms, format='extxyz', append=True)) # # for extxyz file # dataset: ase @@ -90,7 +80,9 @@ npz_fixed_field_keys: # - user_label # key_mapping: # user_label: label0 -# + + +# alternatively, you can read directly from a VASP OUTCAR file (this will only read that single OUTCAR) # # for VASP OUTCAR, the yaml input should be # dataset: ase # dataset_file_name: OUTCAR @@ -99,10 +91,27 @@ npz_fixed_field_keys: # key_mapping: # free_energy: total_energy +# npz example +# the keys used need to be stated at least once in key_mapping, npz_fixed_field_keys or include_keys +# key_mapping is used to map the key in the npz file to the NequIP default values (see data/_key.py) +# all arrays are expected to have the shape of (nframe, natom, ?) except the fixed fields +# note that if your data set uses pbc, you need to also pass an array that maps to the nequip "pbc" key +dataset: npz # type of data set, can be npz or ase +dataset_url: http://quantum-machine.org/gdml/data/npz/toluene_ccsd_t.zip # url to download the npz. optional +dataset_file_name: ./benchmark_data/toluene_ccsd_t-train.npz # path to data set file +key_mapping: + z: atomic_numbers # atomic species, integers + E: total_energy # total potential eneriges to train to + F: forces # atomic forces to train to + R: pos # raw atomic positions +npz_fixed_field_keys: # fields that are repeated across different examples + - atomic_numbers + # A list of atomic types to be found in the data. The NequIP types will be named with the chemical symbols, and inputs with the correct atomic numbers will be mapped to the corresponding types. chemical_symbols: - - H - - C + - H + - C + # Alternatively, you may explicitly specify which chemical species maps to which type in NequIP (type index; the name is still taken from the chemical symbol) # chemical_symbol_to_type: # H: 0 @@ -149,14 +158,14 @@ n_train: 100 n_val: 50 # number of validation data learning_rate: 0.005 # learning rate, we found values between 0.01 and 0.005 to work best - this is often one of the most important hyperparameters to tune batch_size: 5 # batch size, we found it important to keep this small for most applications including forces (1-5); for energy-only training, higher batch sizes work better -max_epochs: 100000 # stop training after _ number of epochs, we set a very large number here, it won't take this long in practice and we will use early stopping instead +max_epochs: 100000 # stop training after _ number of epochs, we set a very large number here, it won't take this long in practice and we will use early stopping instead train_val_split: random # can be random or sequential. 
if sequential, first n_train elements are training, next n_val are val, else random, usually random is the right choice shuffle: true # If true, the data loader will shuffle the data, usually a good idea -metrics_key: validation_loss # metrics used for scheduling and saving best model. Options: `set`_`quantity`, set can be either "train" or "validation, "quantity" can be loss or anything that appears in the validation batch step header, such as f_mae, f_rmse, e_mae, e_rmse +metrics_key: validation_loss # metrics used for scheduling and saving best model. Options: `set`_`quantity`, set can be either "train" or "validation, "quantity" can be loss or anything that appears in the validation batch step header, such as f_mae, f_rmse, e_mae, e_rmse use_ema: true # if true, use exponential moving average on weights for val/test, usually helps a lot with training, in particular for energy errors ema_decay: 0.99 # ema weight, typically set to 0.99 or 0.999 ema_use_num_updates: true # whether to use number of updates when computing averages -report_init_validation: false # if True, report the validation error for just initialized model +report_init_validation: true # if True, report the validation error for just initialized model # early stopping based on metrics values. # LR, wall and any keys printed in the log file can be used. @@ -177,8 +186,8 @@ early_stopping_upper_bounds: # loss function loss_coeffs: # different weights to use in a weighted loss functions - forces: 1 # for MD applications, we recommed a force weight of 100 and an energy weight of 1 - total_energy: # alternatively, if energies are not of importance, a force weight 1 and an energy weight of 0 also works. + forces: 1 # if using PerAtomMSELoss, a default weight of 1:1 on each should work well + total_energy: - 1 - PerAtomMSELoss @@ -214,22 +223,28 @@ loss_coeffs: # output metrics metrics_components: - - - forces # key - - rmse # "rmse" or "mse" - - PerSpecies: True # if true, per species contribution is counted separately - report_per_component: False # if true, statistics on each component (i.e. fx, fy, fz) will be counted separately + - - forces # key + - mae # "rmse" or "mae" + - - forces + - rmse - - forces - mae - - PerSpecies: True - report_per_component: False + - PerSpecies: True # if true, per species contribution is counted separately + report_per_component: False # if true, statistics on each component (i.e. 
fx, fy, fz) will be counted separately + - - forces + - rmse + - PerSpecies: True + report_per_component: False + - - total_energy + - mae - - total_energy - mae - PerAtom: True # if true, energy is normalized by the number of atoms # optimizer, may be any optimizer defined in torch.optim # the name `optimizer_name`is case sensitive -optimizer_name: Adam # default optimizer is Adam in the amsgrad mode -optimizer_amsgrad: true +optimizer_name: Adam # default optimizer is Adam +optimizer_amsgrad: false optimizer_betas: !!python/tuple - 0.9 - 0.999 From bc904eb256258532a89ba86ae4d7a1296bcc8bad Mon Sep 17 00:00:00 2001 From: Simon Batzner Date: Sat, 19 Feb 2022 11:57:22 -0500 Subject: [PATCH 30/53] better max_epochs + early stopping --- configs/example.yaml | 5 ++++- configs/full.yaml | 2 +- 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/configs/example.yaml b/configs/example.yaml index 84d1816a..ec335d29 100644 --- a/configs/example.yaml +++ b/configs/example.yaml @@ -78,7 +78,7 @@ n_train: 100 n_val: 50 # number of validation data learning_rate: 0.005 # learning rate, we found values between 0.01 and 0.005 to work best - this is often one of the most important hyperparameters to tune batch_size: 5 # batch size, we found it important to keep this small for most applications including forces (1-5); for energy-only training, higher batch sizes work better -max_epochs: 100000 # stop training after _ number of epochs, we set a very large number here, it won't take this long in practice and we will use early stopping instead +max_epochs: 100 # stop training after _ number of epochs, we set a small number here to have an example that finished within a few minutes, but in practice we recommend using a very large number, as e.g. 1million and then to just use early stopping and not train the full number of epochs train_val_split: random # can be random or sequential. if sequential, first n_train elements are training, next n_val are val, else random, usually random is the right choice shuffle: true # if true, the data loader will shuffle the data, usually a good idea metrics_key: validation_loss # metrics used for scheduling and saving best model. 
Options: `set`_`quantity`, set can be either "train" or "validation, "quantity" can be loss or anything that appears in the validation batch step header, such as f_mae, f_rmse, e_mae, e_rmse @@ -91,6 +91,9 @@ report_init_validation: true early_stopping_patiences: # stop early if a metric value stopped decreasing for n epochs validation_loss: 50 +early_stopping_lower_bounds: # stop early if a metric value is lower than the bound + LR: 1.0e-5 + # loss function loss_coeffs: forces: 1 # if using PerAtomMSELoss, a default weight of 1:1 on each should work well diff --git a/configs/full.yaml b/configs/full.yaml index 42a2eab9..2774b1d9 100644 --- a/configs/full.yaml +++ b/configs/full.yaml @@ -179,7 +179,7 @@ early_stopping_delta: early_stopping_cumulative_delta: false # If True, the minimum value recorded will not be updated when the decrease is smaller than delta early_stopping_lower_bounds: # stop early if a metric value is lower than the bound - LR: 1.0e-6 + LR: 1.0e-5 early_stopping_upper_bounds: # stop early if a metric value is higher than the bound wall: 1.0e+100 From 4ac629f58aafa96cf2b575dc6e2988d93b4974cf Mon Sep 17 00:00:00 2001 From: Simon Batzner Date: Sat, 19 Feb 2022 12:04:34 -0500 Subject: [PATCH 31/53] better comments --- configs/example.yaml | 10 +++++----- configs/full.yaml | 7 ++++--- 2 files changed, 9 insertions(+), 8 deletions(-) diff --git a/configs/example.yaml b/configs/example.yaml index ec335d29..ba780e9e 100644 --- a/configs/example.yaml +++ b/configs/example.yaml @@ -16,13 +16,13 @@ r_max: 4.0 num_layers: 4 # number of interaction blocks, we find 3-5 to work best l_max: 1 # the maximum irrep order (rotation order) for the network's features, l=1 is a good default, l=2 is more accurate but slower parity: true # whether to include features with odd mirror parity; often turning parity off gives equally good results but faster networks, so do consider this -num_features: 32 # the multiplicity of the features +num_features: 32 # the multiplicity of the features, 32 is a good default for accurate network, if you want to be more accurate, go larger, if you want to be faster, go lower nonlinearity_type: gate # may be 'gate' or 'norm', 'gate' is recommended # scalar nonlinearities to use — available options are silu, ssp (shifted softplus), tanh, and abs. # Different nonlinearities are specified for e (even) and o (odd) parity; # note that only tanh and abs are correct for o (odd parity) -# silu typically works best +# silu typically works best for even nonlinearity_scalars: e: silu o: tanh @@ -70,8 +70,8 @@ wandb_project: toluene-example verbose: info # the same as python logging, e.g. warning, info, debug, error; case insensitive log_batch_freq: 10 # batch frequency, how often to print training errors withinin the same epoch log_epoch_freq: 1 # epoch frequency, how often to print and save the model -save_checkpoint_freq: -1 # frequency to save the intermediate checkpoint. no saving when the value is not positive. -save_ema_checkpoint_freq: -1 # frequency to save the intermediate ema checkpoint. no saving when the value is not positive. +save_checkpoint_freq: -1 # frequency to save the intermediate checkpoint. no saving of intermediate checkpoints when the value is not positive. +save_ema_checkpoint_freq: -1 # frequency to save the intermediate ema checkpoint. no saving of intermediate checkpoints when the value is not positive. 
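A note on the 1:1 weighting recommended above: `PerAtomMSELoss` compares total energies only after dividing by the number of atoms, which keeps the energy term size-consistent next to the force term. The following is a toy sketch of that weighting, not the project's loss code; every tensor below is a made-up placeholder.

    import torch

    def toy_weighted_loss(pred_E, true_E, pred_F, true_F, n_atoms, w_e=1.0, w_f=1.0):
        # Energy term: normalize total energies by atom count before the MSE,
        # so the energy contribution does not grow with system size.
        e_term = torch.mean(((pred_E - true_E) / n_atoms) ** 2)
        # Force term: plain MSE over all force components.
        f_term = torch.mean((pred_F - true_F) ** 2)
        return w_e * e_term + w_f * f_term

    # Placeholder batch: two structures with 3 and 5 atoms (8 atoms total).
    loss = toy_weighted_loss(
        pred_E=torch.tensor([-10.1, -17.3]),
        true_E=torch.tensor([-10.0, -17.5]),
        pred_F=torch.zeros(8, 3),
        true_F=torch.zeros(8, 3),
        n_atoms=torch.tensor([3.0, 5.0]),
    )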
# training n_train: 100 # number of training data @@ -93,7 +93,7 @@ early_stopping_patiences: early_stopping_lower_bounds: # stop early if a metric value is lower than the bound LR: 1.0e-5 - + # loss function loss_coeffs: forces: 1 # if using PerAtomMSELoss, a default weight of 1:1 on each should work well diff --git a/configs/full.yaml b/configs/full.yaml index 2774b1d9..81c780e5 100644 --- a/configs/full.yaml +++ b/configs/full.yaml @@ -23,7 +23,7 @@ num_layers: 4 l_max: 1 # the maximum irrep order (rotation order) for the network's features, l=1 is a good default, l=2 is more accurate but slower parity: true # whether to include features with odd mirror parityy; often turning parity off gives equally good results but faster networks, so do consider this -num_features: 32 # the multiplicity of the features +num_features: 32 # the multiplicity of the features, 32 is a good default for accurate network, if you want to be more accurate, go larger, if you want to be faster, go lower # alternatively, the irreps of the features in various parts of the network can be specified directly: # the following options use e3nn irreps notation @@ -41,6 +41,7 @@ resnet: false # scalar nonlinearities to use — available options are silu, ssp (shifted softplus), tanh, and abs. # Different nonlinearities are specified for e (even) and o (odd) parity; # note that only tanh and abs are correct for o (odd parity). +# silu typically works best for even nonlinearity_scalars: e: silu o: tanh @@ -150,8 +151,8 @@ wandb_watch: false verbose: info # the same as python logging, e.g. warning, info, debug, error. case insensitive log_batch_freq: 1 # batch frequency, how often to print training errors withinin the same epoch log_epoch_freq: 1 # epoch frequency, how often to print and save the model -save_checkpoint_freq: -1 # frequency to save the intermediate checkpoint. no saving when the value is not positive. -save_ema_checkpoint_freq: -1 # frequency to save the intermediate ema checkpoint. no saving when the value is not positive. +save_checkpoint_freq: -1 # frequency to save the intermediate checkpoint. no saving of intermediate checkpoints when the value is not positive. +save_ema_checkpoint_freq: -1 # frequency to save the intermediate ema checkpoint. no saving of intermediate checkpoints when the value is not positive. # training n_train: 100 # number of training data From ef019b4785f4d47835ebe05f4eb1627d8f339a87 Mon Sep 17 00:00:00 2001 From: Simon Batzner Date: Sat, 19 Feb 2022 12:10:18 -0500 Subject: [PATCH 32/53] correct docs for lr scheduler --- configs/example.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/configs/example.yaml b/configs/example.yaml index ba780e9e..e285ac4a 100644 --- a/configs/example.yaml +++ b/configs/example.yaml @@ -126,8 +126,8 @@ metrics_components: optimizer_name: Adam # default optimizer is Adam optimizer_amsgrad: false -# lr scheduler, currently only supports the two options listed below, if you need more please file an issue -# first: on-plateau, reduce lr by factory of lr_scheduler_factor if metrics_key hasn't improved for lr_scheduler_patience epoch +# lr scheduler, currently only supports the two options listed in full.yaml, i.e. 
on-pleteau and cosine annealing with warm restarts, if you need more please file an issue +# here: on-plateau, reduce lr by factory of lr_scheduler_factor if metrics_key hasn't improved for lr_scheduler_patience epoch lr_scheduler_name: ReduceLROnPlateau lr_scheduler_patience: 100 lr_scheduler_factor: 0.5 From 1ff745abe3e4d2594292beb21bdaee97f81047cc Mon Sep 17 00:00:00 2001 From: Simon Batzner Date: Sat, 19 Feb 2022 12:12:11 -0500 Subject: [PATCH 33/53] better comments for shift/scales --- configs/example.yaml | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/configs/example.yaml b/configs/example.yaml index e285ac4a..67000f88 100644 --- a/configs/example.yaml +++ b/configs/example.yaml @@ -137,15 +137,17 @@ lr_scheduler_factor: 0.5 # the default is to scale the atomic energy and forces by scaling them by the force standard deviation and to shift the energy by the mean atomic energy # in certain cases, it can be useful to have a trainable shift/scale and to also have species-dependent shifts/scales for each atom +# whether the shifts and scales are trainable. Defaults to False. Optional per_species_rescale_shifts_trainable: false per_species_rescale_scales_trainable: false -# whether the shifts and scales are trainable. Defaults to False. Optional -per_species_rescale_shifts: dataset_per_atom_total_energy_mean # initial atomic energy shift for each species. default to the mean of per atom energy. Optional # the value can be a constant float value, an array for each species, or a string that defines a statistics over the training dataset -per_species_rescale_scales: dataset_forces_rms +per_species_rescale_shifts: dataset_per_atom_total_energy_mean + # initial atomic energy scale for each species. Optional. # the value can be a constant float value, an array for each species, or a string -# per_species_rescale_arguments_in_dataset_units: True +per_species_rescale_scales: dataset_forces_rms + # if explicit numbers are given for the shifts/scales, this parameter must specify whether the given numbers are unitless shifts/scales or are in the units of the dataset. If ``True``, any global rescalings will correctly be applied to the per-species values. +# per_species_rescale_arguments_in_dataset_units: True From e61d8e1d9146c5d330f06dd9edd7688022c95b5d Mon Sep 17 00:00:00 2001 From: Simon Batzner Date: Sat, 19 Feb 2022 12:56:54 -0500 Subject: [PATCH 34/53] default wandb: true: --- configs/full.yaml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/configs/full.yaml b/configs/full.yaml index 81c780e5..f1597287 100644 --- a/configs/full.yaml +++ b/configs/full.yaml @@ -2,7 +2,7 @@ # This is a full yaml file with all nequip options. 
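The on-plateau scheduler settings combine naturally with the new `early_stopping_lower_bounds` on the learning rate: once `ReduceLROnPlateau` has halved the LR enough times, the run stops. A plain-PyTorch sketch of that interplay follows; the toy model, data, and loop are stand-ins for illustration and are not the nequip trainer.

    import torch

    # Stand-in model and data; this loop only illustrates the scheduler/bound logic.
    model = torch.nn.Linear(8, 1)
    x, y = torch.randn(32, 8), torch.randn(32, 1)
    opt = torch.optim.Adam(model.parameters(), lr=0.005)
    # mirrors lr_scheduler_name / lr_scheduler_factor / lr_scheduler_patience above
    sched = torch.optim.lr_scheduler.ReduceLROnPlateau(opt, factor=0.5, patience=100)

    for epoch in range(100000):
        opt.zero_grad()
        metric = torch.nn.functional.mse_loss(model(x), y)  # stand-in for validation_loss
        metric.backward()
        opt.step()
        sched.step(metric)                      # reduce the LR when the metric plateaus
        if opt.param_groups[0]["lr"] < 1.0e-5:  # analogue of early_stopping_lower_bounds: LR
            break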
# It is primarily intented to serve as documentation/reference for all options -# For a simpler yaml file containing all necessary features to get you started, we stronlgy recommend to start with configs/example.yaml +# For a simpler yaml file containing all necessary features to get you started, we strongly recommend to start with configs/example.yaml # Two folders will be used during the training: 'root'/process and 'root'/'run_name' # run_name contains logfiles and saved models @@ -139,9 +139,10 @@ chemical_symbols: # validation_dataset_file_name: xxx.xyz # need to be a format accepted by ase.io.read # logging -wandb: false # we recommend using wandb for logging, we'll turn it off here as it's optional +wandb: true # we recommend using wandb for logging wandb_project: toluene-example # project name used in wandb wandb_watch: false + # see https://docs.wandb.ai/ref/python/watch # wandb_watch_kwargs: # log: all From 2d7518a3ef3716dbdc24013eafad905f3ab13abf Mon Sep 17 00:00:00 2001 From: Simon Batzner Date: Sun, 20 Feb 2022 12:19:35 -0500 Subject: [PATCH 35/53] better type index description --- configs/full.yaml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/configs/full.yaml b/configs/full.yaml index f1597287..37185ad2 100644 --- a/configs/full.yaml +++ b/configs/full.yaml @@ -113,7 +113,8 @@ chemical_symbols: - H - C -# Alternatively, you may explicitly specify which chemical species maps to which type in NequIP (type index; the name is still taken from the chemical symbol) +# Alternatively, you may explicitly specify which chemical species in the input will map to NequIP atom type 0, which to atom type 1, and so on. +# Other than providing an explicit order for the NequIP atom types, this option behaves the same as `chemical_symbols` # chemical_symbol_to_type: # H: 0 # C: 1 From 5278fd24cafdd2ef402694f631fae62184634563 Mon Sep 17 00:00:00 2001 From: Simon Batzner Date: Sun, 20 Feb 2022 13:49:03 -0500 Subject: [PATCH 36/53] Update configs/full.yaml --- configs/full.yaml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/configs/full.yaml b/configs/full.yaml index 37185ad2..090dc1a4 100644 --- a/configs/full.yaml +++ b/configs/full.yaml @@ -108,7 +108,9 @@ key_mapping: npz_fixed_field_keys: # fields that are repeated across different examples - atomic_numbers -# A list of atomic types to be found in the data. The NequIP types will be named with the chemical symbols, and inputs with the correct atomic numbers will be mapped to the corresponding types. +# A list of chemical species found in the data. The NequIP atom types will be named after the chemical symbols and ordered by atomic number in ascending order. +# (In this case, NequIP's internal atom type 0 will be named H and type 1 will be named C.) +# Atoms in the input will be assigned NequIP atom types according to their atomic numbers. chemical_symbols: - H - C From 4a2901ece0b96683c7ad291c5a4db556c507dcd4 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Mon, 21 Feb 2022 15:56:26 -0500 Subject: [PATCH 37/53] all_ -> ps_mean_ --- CHANGELOG.md | 1 + nequip/train/metrics.py | 2 +- 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 4f230cbc..212f1688 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -13,6 +13,7 @@ Most recent change on the bottom. 
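The ordering rule described in that comment (implicit types sorted by atomic number, named after the chemical symbols) can be seen in a few lines. This is only a sketch of the bookkeeping, not the actual `TypeMapper` code.

    from ase.data import atomic_numbers

    chemical_symbols = ["C", "H"]  # as listed in the config; the order given there does not matter

    # Implicit mapping: sort by atomic number, then assign consecutive type indices.
    ordered = sorted(chemical_symbols, key=lambda s: atomic_numbers[s])
    chemical_symbol_to_type = {sym: i for i, sym in enumerate(ordered)}
    print(chemical_symbol_to_type)  # {'H': 0, 'C': 1}: type 0 is named H, type 1 is named C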
### Changed - default value for `report_init_validation` is now `True` +- `all_*_*` metrics rename to -> `ps_mean_*_*` ### Fixed - error if both per-species and global shift are used together diff --git a/nequip/train/metrics.py b/nequip/train/metrics.py index c1085e2f..8256c30a 100644 --- a/nequip/train/metrics.py +++ b/nequip/train/metrics.py @@ -240,7 +240,7 @@ def flatten_metrics(self, metrics, type_names=None): else: flat_dict[f"{id_ele}_{item_name}"] = v.item() - flat_dict[f"all_{item_name}"] = value.mean().item() + flat_dict[f"ps_mean_{item_name}"] = value.mean().item() else: for id_ele, vec in enumerate(value): ele = type_names[id_ele] From f318448bbab1a88807a6ca6fb0a54cf2572dd81c Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Mon, 21 Feb 2022 16:35:00 -0500 Subject: [PATCH 38/53] test calculator forces --- tests/integration/test_deploy.py | 20 ++++++++++++-------- 1 file changed, 12 insertions(+), 8 deletions(-) diff --git a/tests/integration/test_deploy.py b/tests/integration/test_deploy.py index 2d42ba2a..e2a6e500 100644 --- a/tests/integration/test_deploy.py +++ b/tests/integration/test_deploy.py @@ -9,7 +9,8 @@ import torch import nequip -from nequip.data import AtomicDataDict, AtomicData +from nequip.data import AtomicDataDict, AtomicData, dataset_from_config +from nequip.utils import Config from nequip.scripts import deploy from nequip.train import Trainer from nequip.ase import NequIPCalculator @@ -18,7 +19,7 @@ @pytest.mark.parametrize( "device", ["cpu"] + (["cuda"] if torch.cuda.is_available() else []) ) -def test_deploy(nequip_dataset, BENCHMARK_ROOT, device): +def test_deploy(BENCHMARK_ROOT, device): dtype = str(torch.get_default_dtype())[len("torch.") :] atol = {"float32": 1e-5, "float64": 1e-7}[dtype] @@ -33,7 +34,7 @@ def test_deploy(nequip_dataset, BENCHMARK_ROOT, device): with tempfile.TemporaryDirectory() as tmpdir: # Save time run_name = "test_deploy" + dtype - root = "./" + root = tmpdir + "nequip_rootdir/" true_config["run_name"] = run_name true_config["root"] = root true_config["dataset_file_name"] = str( @@ -44,7 +45,8 @@ def test_deploy(nequip_dataset, BENCHMARK_ROOT, device): true_config["n_train"] = 1 true_config["n_val"] = 1 config_path = "conf.yaml" - with open(f"{tmpdir}/{config_path}", "w+") as fp: + full_config_path = f"{tmpdir}/{config_path}" + with open(full_config_path, "w+") as fp: yaml.dump(true_config, fp) # Train model retcode = subprocess.run(["nequip-train", str(config_path)], cwd=tmpdir) @@ -61,13 +63,15 @@ def test_deploy(nequip_dataset, BENCHMARK_ROOT, device): # now test predictions the same best_mod, _ = Trainer.load_model_from_training_session( - traindir=f"{tmpdir}/{root}/{run_name}/", + traindir=f"{root}/{run_name}/", model_name="best_model.pth", device=device, ) best_mod.eval() - data = AtomicData.to_AtomicDataDict(nequip_dataset[0].to(device)) + # load train dataset, already cached + dataset = dataset_from_config(Config.from_file(full_config_path)) + data = AtomicData.to_AtomicDataDict(dataset[0].to(device)) for k in keys: data.pop(k) train_pred = best_mod(data) @@ -86,7 +90,7 @@ def test_deploy(nequip_dataset, BENCHMARK_ROOT, device): assert len(metadata[deploy.TYPE_NAMES_KEY].split(" ")) == 3 # C, H, O data_idx = 0 - data = AtomicData.to_AtomicDataDict(nequip_dataset[data_idx].to("cpu")) + data = AtomicData.to_AtomicDataDict(dataset[data_idx].to("cpu")) for k in keys: data.pop(k) deploy_pred = deploy_mod(data) @@ -118,7 +122,7 @@ def test_deploy(nequip_dataset, BENCHMARK_ROOT, 
device): set_global_options=False, ) # use .get() so it's not transformed - atoms = nequip_dataset.get(nequip_dataset.indices()[data_idx]).to_ase() + atoms = dataset.get(dataset.indices()[data_idx]).to_ase() atoms.calc = calc ase_pred = { AtomicDataDict.TOTAL_ENERGY_KEY: atoms.get_potential_energy(), From 41d35c49e9a06ffa0045ca38e5ef36c65a4a14f9 Mon Sep 17 00:00:00 2001 From: Simon Batzner Date: Mon, 21 Feb 2022 16:59:48 -0500 Subject: [PATCH 39/53] better epoch_freq docs --- configs/example.yaml | 2 +- configs/full.yaml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/configs/example.yaml b/configs/example.yaml index 67000f88..20997621 100644 --- a/configs/example.yaml +++ b/configs/example.yaml @@ -69,7 +69,7 @@ wandb_project: toluene-example verbose: info # the same as python logging, e.g. warning, info, debug, error; case insensitive log_batch_freq: 10 # batch frequency, how often to print training errors withinin the same epoch -log_epoch_freq: 1 # epoch frequency, how often to print and save the model +log_epoch_freq: 1 # epoch frequency, how often to print save_checkpoint_freq: -1 # frequency to save the intermediate checkpoint. no saving of intermediate checkpoints when the value is not positive. save_ema_checkpoint_freq: -1 # frequency to save the intermediate ema checkpoint. no saving of intermediate checkpoints when the value is not positive. diff --git a/configs/full.yaml b/configs/full.yaml index 090dc1a4..19e00feb 100644 --- a/configs/full.yaml +++ b/configs/full.yaml @@ -154,7 +154,7 @@ wandb_watch: false verbose: info # the same as python logging, e.g. warning, info, debug, error. case insensitive log_batch_freq: 1 # batch frequency, how often to print training errors withinin the same epoch -log_epoch_freq: 1 # epoch frequency, how often to print and save the model +log_epoch_freq: 1 # epoch frequency, how often to print save_checkpoint_freq: -1 # frequency to save the intermediate checkpoint. no saving of intermediate checkpoints when the value is not positive. save_ema_checkpoint_freq: -1 # frequency to save the intermediate ema checkpoint. no saving of intermediate checkpoints when the value is not positive. From 96fdebfaf5e7e13b03179d64476776d7ebebaf55 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 22 Feb 2022 11:56:28 -0500 Subject: [PATCH 40/53] shorter name --- CHANGELOG.md | 2 +- nequip/train/metrics.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 212f1688..286548d6 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -13,7 +13,7 @@ Most recent change on the bottom. 
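For context on the metric rename in the surrounding patches: the renamed quantity is simply the unweighted mean of a per-species metric over atom types (the `value.mean()` in `flatten_metrics`). A small stand-alone illustration with made-up numbers, using only plain torch:

    import torch

    n_types = 2
    atom_types = torch.tensor([0, 0, 1, 1, 1])    # made-up type index for 5 atoms
    abs_err = torch.rand(5, 3)                    # made-up |F_pred - F_true| per component

    per_atom = abs_err.mean(dim=1)                # average over the x/y/z components

    # Per-species MAE: sum the per-atom errors for each type, divide by the count.
    sums = torch.zeros(n_types).index_add_(0, atom_types, per_atom)
    counts = torch.zeros(n_types).index_add_(0, atom_types, torch.ones_like(per_atom))
    per_species_mae = sums / counts               # one entry per atom type

    psavg_f_mae = per_species_mae.mean()          # the "psavg"-style summary: unweighted mean over types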
### Changed - default value for `report_init_validation` is now `True` -- `all_*_*` metrics rename to -> `ps_mean_*_*` +- `all_*_*` metrics rename to -> `psavg_*_*` ### Fixed - error if both per-species and global shift are used together diff --git a/nequip/train/metrics.py b/nequip/train/metrics.py index 8256c30a..485e87d5 100644 --- a/nequip/train/metrics.py +++ b/nequip/train/metrics.py @@ -240,7 +240,7 @@ def flatten_metrics(self, metrics, type_names=None): else: flat_dict[f"{id_ele}_{item_name}"] = v.item() - flat_dict[f"ps_mean_{item_name}"] = value.mean().item() + flat_dict[f"psavg_{item_name}"] = value.mean().item() else: for id_ele, vec in enumerate(value): ele = type_names[id_ele] From ee82a33642b7f21fe0eed50d891cd20009f5e9e5 Mon Sep 17 00:00:00 2001 From: Simon Batzner Date: Tue, 22 Feb 2022 11:58:12 -0500 Subject: [PATCH 41/53] add VASP special case --- configs/full.yaml | 2 ++ 1 file changed, 2 insertions(+) diff --git a/configs/full.yaml b/configs/full.yaml index 19e00feb..64451518 100644 --- a/configs/full.yaml +++ b/configs/full.yaml @@ -89,6 +89,8 @@ use_sc: true # dataset_file_name: OUTCAR # ase_args: # format: vasp-out +# important VASP note: the ase vasp parser stores the potential energy to "free_energy" instead of "energy". +# Here, the key_mapping maps the external name (key) to the NequIP default name (value) # key_mapping: # free_energy: total_energy From 040c8c477b534b751f7c298d3533e8c21b7627cd Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 22 Feb 2022 13:41:02 -0500 Subject: [PATCH 42/53] use fusion_strategy for >=1.11 --- nequip/scripts/deploy.py | 29 ++++++++++++++++++++++++----- nequip/scripts/train.py | 11 ++++++++--- 2 files changed, 32 insertions(+), 8 deletions(-) diff --git a/nequip/scripts/deploy.py b/nequip/scripts/deploy.py index 736de9a4..606529cb 100644 --- a/nequip/scripts/deploy.py +++ b/nequip/scripts/deploy.py @@ -20,7 +20,7 @@ from e3nn.util.jit import script -from nequip.scripts.train import _set_global_options +from nequip.scripts.train import _set_global_options, default_config from nequip.train import Trainer from nequip.utils import Config from nequip.utils.versions import check_code_version, get_config_code_versions @@ -34,6 +34,7 @@ N_SPECIES_KEY: Final[str] = "n_species" TYPE_NAMES_KEY: Final[str] = "type_names" JIT_BAILOUT_KEY: Final[str] = "_jit_bailout_depth" +JIT_FUSION_STRATEGY_KEY: Final[str] = "_jit_fusion_strategy" TF32_KEY: Final[str] = "allow_tf32" _ALL_METADATA_KEYS = [ @@ -45,6 +46,7 @@ N_SPECIES_KEY, TYPE_NAMES_KEY, JIT_BAILOUT_KEY, + JIT_FUSION_STRATEGY_KEY, TF32_KEY, ] @@ -113,14 +115,28 @@ def load_deployed_model( torch.backends.cudnn.allow_tf32 = allow_tf32 # JIT bailout - if metadata[JIT_BAILOUT_KEY] != "": - jit_bailout: int = int(metadata[JIT_BAILOUT_KEY]) + if torch.__version__.split(".")[1] >= 11: + strategy = metadata.get(JIT_BAILOUT_KEY, "") + if strategy != "": + strategy = [e.split(",") for e in .split(";")] + strategy = [(e[0], int(e[1])) for e in strategy] + else: + strategy = default_config["_jit_fusion_strategy"] # no way to get current value, so assume we are overwriting it if set_global_options == "warn": warnings.warn( - "Loaded model had a different value for _jit_bailout_depth than was currently set; changing the GLOBAL setting!" + "Loaded model had a different value for JIT fusion_strategy than was currently set; changing the GLOBAL setting!" 
) - torch._C._jit_set_bailout_depth(jit_bailout) + torch.jit.set_fusion_strategy(strategy) + else: + if metadata[JIT_BAILOUT_KEY] != "": + jit_bailout: int = int(metadata[JIT_BAILOUT_KEY]) + # no way to get current value, so assume we are overwriting it + if set_global_options == "warn": + warnings.warn( + "Loaded model had a different value for _jit_bailout_depth than was currently set; changing the GLOBAL setting!" + ) + torch._C._jit_set_bailout_depth(jit_bailout) return model, metadata @@ -217,6 +233,9 @@ def main(args=None): metadata[N_SPECIES_KEY] = str(n_species) metadata[TYPE_NAMES_KEY] = " ".join(type_names) + metadata[JIT_FUSION_STRATEGY_KEY] = ";".join( + "%s,%i" % e for e in config.get("_jit_fusion_strategy", "") + ) metadata[JIT_BAILOUT_KEY] = str(config["_jit_bailout_depth"]) metadata[TF32_KEY] = str(int(config["allow_tf32"])) metadata[CONFIG_KEY] = (args.train_dir / "config.yaml").read_text() diff --git a/nequip/scripts/train.py b/nequip/scripts/train.py index f67f77b2..8aa55b8b 100644 --- a/nequip/scripts/train.py +++ b/nequip/scripts/train.py @@ -44,6 +44,7 @@ grad_anomaly_mode=False, append=False, _jit_bailout_depth=2, # avoid 20 iters of pain, see https://github.com/pytorch/pytorch/issues/52286 + _jit_fusion_strategy=[("DYANMIC", 5)], # for pytorch >= 1.11 ) @@ -118,9 +119,13 @@ def _set_global_options(config): torch.backends.cuda.matmul.allow_tf32 = False torch.backends.cudnn.allow_tf32 = False - # For avoiding 20 steps of painfully slow JIT recompilation - # See https://github.com/pytorch/pytorch/issues/52286 - torch._C._jit_set_bailout_depth(config["_jit_bailout_depth"]) + if torch.__version__.split(".")[1] >= 11: + # PyTorch >= 1.11 + torch.jit.set_fusion_strategy(config["_jit_fusion_strategy"]) + else: + # For avoiding 20 steps of painfully slow JIT recompilation + # See https://github.com/pytorch/pytorch/issues/52286 + torch._C._jit_set_bailout_depth(config["_jit_bailout_depth"]) if config.model_debug_mode: set_irreps_debug(enabled=True) From df1ba184838dd10a1127e1a285f94948a7c39feb Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 22 Feb 2022 13:51:32 -0500 Subject: [PATCH 43/53] Revert "use fusion_strategy for >=1.11" This reverts commit 040c8c477b534b751f7c298d3533e8c21b7627cd. 
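The commit reverted here gated on the PyTorch version string. As a general illustration only (not the code that ultimately shipped), such a gate is usually written by parsing the version into integers before comparing; the fusion-strategy and bailout-depth values below are placeholders.

    import torch

    # Parse the version into integers before comparing (illustrative gate only).
    major, minor = (int(v) for v in torch.__version__.split(".")[:2])

    if (major, minor) >= (1, 11):
        # Newer PyTorch exposes a structured fusion-strategy knob.
        torch.jit.set_fusion_strategy([("DYNAMIC", 5)])
    else:
        # Older PyTorch: set the bailout depth to avoid repeated slow recompilation.
        torch._C._jit_set_bailout_depth(2)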
--- nequip/scripts/deploy.py | 29 +++++------------------------ nequip/scripts/train.py | 11 +++-------- 2 files changed, 8 insertions(+), 32 deletions(-) diff --git a/nequip/scripts/deploy.py b/nequip/scripts/deploy.py index 606529cb..736de9a4 100644 --- a/nequip/scripts/deploy.py +++ b/nequip/scripts/deploy.py @@ -20,7 +20,7 @@ from e3nn.util.jit import script -from nequip.scripts.train import _set_global_options, default_config +from nequip.scripts.train import _set_global_options from nequip.train import Trainer from nequip.utils import Config from nequip.utils.versions import check_code_version, get_config_code_versions @@ -34,7 +34,6 @@ N_SPECIES_KEY: Final[str] = "n_species" TYPE_NAMES_KEY: Final[str] = "type_names" JIT_BAILOUT_KEY: Final[str] = "_jit_bailout_depth" -JIT_FUSION_STRATEGY_KEY: Final[str] = "_jit_fusion_strategy" TF32_KEY: Final[str] = "allow_tf32" _ALL_METADATA_KEYS = [ @@ -46,7 +45,6 @@ N_SPECIES_KEY, TYPE_NAMES_KEY, JIT_BAILOUT_KEY, - JIT_FUSION_STRATEGY_KEY, TF32_KEY, ] @@ -115,28 +113,14 @@ def load_deployed_model( torch.backends.cudnn.allow_tf32 = allow_tf32 # JIT bailout - if torch.__version__.split(".")[1] >= 11: - strategy = metadata.get(JIT_BAILOUT_KEY, "") - if strategy != "": - strategy = [e.split(",") for e in .split(";")] - strategy = [(e[0], int(e[1])) for e in strategy] - else: - strategy = default_config["_jit_fusion_strategy"] + if metadata[JIT_BAILOUT_KEY] != "": + jit_bailout: int = int(metadata[JIT_BAILOUT_KEY]) # no way to get current value, so assume we are overwriting it if set_global_options == "warn": warnings.warn( - "Loaded model had a different value for JIT fusion_strategy than was currently set; changing the GLOBAL setting!" + "Loaded model had a different value for _jit_bailout_depth than was currently set; changing the GLOBAL setting!" ) - torch.jit.set_fusion_strategy(strategy) - else: - if metadata[JIT_BAILOUT_KEY] != "": - jit_bailout: int = int(metadata[JIT_BAILOUT_KEY]) - # no way to get current value, so assume we are overwriting it - if set_global_options == "warn": - warnings.warn( - "Loaded model had a different value for _jit_bailout_depth than was currently set; changing the GLOBAL setting!" 
- ) - torch._C._jit_set_bailout_depth(jit_bailout) + torch._C._jit_set_bailout_depth(jit_bailout) return model, metadata @@ -233,9 +217,6 @@ def main(args=None): metadata[N_SPECIES_KEY] = str(n_species) metadata[TYPE_NAMES_KEY] = " ".join(type_names) - metadata[JIT_FUSION_STRATEGY_KEY] = ";".join( - "%s,%i" % e for e in config.get("_jit_fusion_strategy", "") - ) metadata[JIT_BAILOUT_KEY] = str(config["_jit_bailout_depth"]) metadata[TF32_KEY] = str(int(config["allow_tf32"])) metadata[CONFIG_KEY] = (args.train_dir / "config.yaml").read_text() diff --git a/nequip/scripts/train.py b/nequip/scripts/train.py index 8aa55b8b..f67f77b2 100644 --- a/nequip/scripts/train.py +++ b/nequip/scripts/train.py @@ -44,7 +44,6 @@ grad_anomaly_mode=False, append=False, _jit_bailout_depth=2, # avoid 20 iters of pain, see https://github.com/pytorch/pytorch/issues/52286 - _jit_fusion_strategy=[("DYANMIC", 5)], # for pytorch >= 1.11 ) @@ -119,13 +118,9 @@ def _set_global_options(config): torch.backends.cuda.matmul.allow_tf32 = False torch.backends.cudnn.allow_tf32 = False - if torch.__version__.split(".")[1] >= 11: - # PyTorch >= 1.11 - torch.jit.set_fusion_strategy(config["_jit_fusion_strategy"]) - else: - # For avoiding 20 steps of painfully slow JIT recompilation - # See https://github.com/pytorch/pytorch/issues/52286 - torch._C._jit_set_bailout_depth(config["_jit_bailout_depth"]) + # For avoiding 20 steps of painfully slow JIT recompilation + # See https://github.com/pytorch/pytorch/issues/52286 + torch._C._jit_set_bailout_depth(config["_jit_bailout_depth"]) if config.model_debug_mode: set_irreps_debug(enabled=True) From c0dda76bec2cfbb347c10230e0a4aaaa53346055 Mon Sep 17 00:00:00 2001 From: Alby M <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 22 Feb 2022 14:57:58 -0500 Subject: [PATCH 44/53] Fix N shape bugs (#157) * fix for peratom * checks in per_species * fix assert * add some asserts * add per atom unit tests * refine assert * mean_std over dim=0 only * test global vector quantity * better error * energies are 1D, flatten * correct assertion * fixed assert Co-authored-by: nw13slx --- nequip/data/dataset.py | 21 ++++++++--- nequip/data/transforms.py | 4 ++- nequip/model/_scaling.py | 4 +-- nequip/train/_loss.py | 14 ++++++-- tests/unit/data/test_dataset.py | 63 +++++++++++++++++++++++++++++++++ 5 files changed, 96 insertions(+), 10 deletions(-) diff --git a/nequip/data/dataset.py b/nequip/data/dataset.py index 44afe560..9d62b20f 100644 --- a/nequip/data/dataset.py +++ b/nequip/data/dataset.py @@ -537,13 +537,18 @@ def _per_atom_statistics( """ # using unique_consecutive handles the non-contiguous selected batch index _, N = torch.unique_consecutive(batch, return_counts=True) + N = N.unsqueeze(-1) + assert N.ndim == 2 + assert N.shape == (len(arr), 1) + assert arr.ndim >= 2 + data_dim = arr.shape[1:] + arr = arr / N + assert arr.shape == (len(N),) + data_dim if ana_mode == "mean_std": - arr = arr / N - mean = torch.mean(arr) - std = torch.std(arr, unbiased=unbiased) + mean = torch.mean(arr, dim=0) + std = torch.std(arr, unbiased=unbiased, dim=0) return mean, std elif ana_mode == "rms": - arr = arr / N return (torch.sqrt(torch.mean(arr.square())),) else: raise NotImplementedError( @@ -567,8 +572,9 @@ def _per_species_statistics( For a per-node quantity, computes the expected statistic but for each type instead of over all nodes. 
""" N = bincount(atom_types.squeeze(-1), batch) + assert N.ndim == 2 # [batch, n_type] N = N[(N > 0).any(dim=1)] # deal with non-contiguous batch indexes - + assert arr.ndim >= 2 if arr_is_per == "graph": if ana_mode != "mean_std": @@ -585,10 +591,15 @@ def _per_species_statistics( if ana_mode == "mean_std": mean = scatter_mean(arr, atom_types, dim=0) + assert mean.shape[1:] == arr.shape[1:] # [N, dims] -> [type, dims] + assert len(mean) == N.shape[1] std = scatter_std(arr, atom_types, dim=0, unbiased=unbiased) + assert std.shape == mean.shape return mean, std elif ana_mode == "rms": square = scatter_mean(arr.square(), atom_types, dim=0) + assert square.shape[1:] == arr.shape[1:] # [N, dims] -> [type, dims] + assert len(square) == N.shape[1] dims = len(square.shape) - 1 for i in range(dims): square = square.mean(axis=-1) diff --git a/nequip/data/transforms.py b/nequip/data/transforms.py index b5c77a32..f2c7ec32 100644 --- a/nequip/data/transforms.py +++ b/nequip/data/transforms.py @@ -150,4 +150,6 @@ def format( + "]" ).format(*zip(type_names, data)) else: - raise ValueError + raise ValueError( + f"Don't know how to format data=`{data}` for types {type_names} with element_formatter=`{element_formatter}`" + ) diff --git a/nequip/model/_scaling.py b/nequip/model/_scaling.py index dba8aa35..03ce4f79 100644 --- a/nequip/model/_scaling.py +++ b/nequip/model/_scaling.py @@ -208,14 +208,14 @@ def PerSpeciesRescale( if isinstance(scales, str): s = scales - scales = computed_stats[str_names.index(scales)] + scales = computed_stats[str_names.index(scales)].squeeze(-1) # energy is 1D logging.info(f"Replace string {s} to {scales}") elif isinstance(scales, (list, float)): scales = torch.as_tensor(scales) if isinstance(shifts, str): s = shifts - shifts = computed_stats[str_names.index(shifts)] + shifts = computed_stats[str_names.index(shifts)].squeeze(-1) # energy is 1D logging.info(f"Replace string {s} to {shifts}") elif isinstance(shifts, (list, float)): shifts = torch.as_tensor(shifts) diff --git a/nequip/train/_loss.py b/nequip/train/_loss.py index 07ec8c80..6df59fe3 100644 --- a/nequip/train/_loss.py +++ b/nequip/train/_loss.py @@ -80,6 +80,7 @@ def __call__( ) if self.func_name == "MSELoss": loss = loss / N + assert loss.shape == pred[key].shape # [atom, dim] if mean: return loss.sum() / not_nan.sum() else: @@ -89,6 +90,7 @@ def __call__( loss = loss / N if self.func_name == "MSELoss": loss = loss / N + assert loss.shape == pred[key].shape # [atom, dim] if mean: return loss.mean() else: @@ -128,25 +130,33 @@ def __call__( if has_nan: if len(reduce_dims) > 0: per_atom_loss = per_atom_loss.sum(dim=reduce_dims) + assert per_atom_loss.ndim == 1 per_species_loss = scatter(per_atom_loss, spe_idx, dim=0) + assert per_species_loss.ndim == 1 # [type] + N = scatter(not_nan, spe_idx, dim=0) N = N.sum(reduce_dims) - N = 1.0 / N + N = N.reciprocal() N_species = ((N == N).int()).sum() + assert N.ndim == 1 # [type] + + per_species_loss = (per_species_loss * N).sum() / N_species - return (per_species_loss * N).sum() / N_species + return per_species_loss else: if len(reduce_dims) > 0: per_atom_loss = per_atom_loss.mean(dim=reduce_dims) + assert per_atom_loss.ndim == 1 # offset species index by 1 to use 0 for nan _, inverse_species_index = torch.unique(spe_idx, return_inverse=True) per_species_loss = scatter_mean(per_atom_loss, inverse_species_index, dim=0) + assert per_species_loss.ndim == 1 # [type] return per_species_loss.mean() diff --git a/tests/unit/data/test_dataset.py b/tests/unit/data/test_dataset.py index 
e580a49a..a05e963d 100644 --- a/tests/unit/data/test_dataset.py +++ b/tests/unit/data/test_dataset.py @@ -13,6 +13,8 @@ NpzDataset, ASEDataset, dataset_from_config, + register_fields, + deregister_fields, ) from nequip.data.transforms import TypeMapper from nequip.utils import Config @@ -188,6 +190,67 @@ def test_edgewise_stats(self, npz_dataset): # TODO: check correct +class TestPerAtomStatistics: + @pytest.mark.parametrize("mode", ["mean_std", "rms"]) + def test_per_node_field(self, npz_dataset, mode): + # set up the transformer + npz_dataset = set_up_transformer(npz_dataset, True, False, False) + + with pytest.raises(ValueError) as excinfo: + npz_dataset.statistics( + [AtomicDataDict.BATCH_KEY], + modes=[f"per_atom_{mode}"], + ) + assert ( + excinfo + == f"It doesn't make sense to ask for `{mode}` since `{AtomicDataDict.BATCH_KEY}` is not per-graph" + ) + + @pytest.mark.parametrize("fixed_field", [True, False]) + @pytest.mark.parametrize("full_rank", [True, False]) + @pytest.mark.parametrize("subset", [True, False]) + @pytest.mark.parametrize( + "key,dim", [(AtomicDataDict.TOTAL_ENERGY_KEY, (1,)), ("somekey", (3,))] + ) + def test_per_graph_field( + self, npz_dataset, fixed_field, full_rank, subset, key, dim + ): + if key == "somekey": + register_fields(graph_fields=[key]) + + npz_dataset = set_up_transformer(npz_dataset, full_rank, fixed_field, subset) + if npz_dataset is None: + return + + E = torch.rand((npz_dataset.len(),) + dim) + ref_mean = torch.mean(E / NATOMS, dim=0) + ref_std = torch.std(E / NATOMS, dim=0) + + if subset: + E_orig_order = torch.zeros( + (npz_dataset.data[AtomicDataDict.TOTAL_ENERGY_KEY].shape[0],) + dim + ) + E_orig_order[npz_dataset._indices] = E + npz_dataset.data[key] = E_orig_order + else: + npz_dataset.data[key] = E + + ((mean, std),) = npz_dataset.statistics( + [key], + modes=["per_atom_mean_std"], + ) + + print("mean", mean, ref_mean) + print("diff in mean", mean - ref_mean) + print("std", std, ref_std) + + assert torch.allclose(mean, ref_mean, rtol=1e-1) + assert torch.allclose(std, ref_std, rtol=1e-2) + + if key == "somekey": + deregister_fields(key) + + class TestPerSpeciesStatistics: @pytest.mark.parametrize("fixed_field", [True, False]) @pytest.mark.parametrize("mode", ["mean_std", "rms"]) From 2186560e16c6e0b8b5b3c26b03d4d7ddf76b3d14 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 22 Feb 2022 15:12:47 -0500 Subject: [PATCH 45/53] wandb record number of weights --- CHANGELOG.md | 1 + nequip/scripts/train.py | 7 ++++++- nequip/train/trainer.py | 5 ----- 3 files changed, 7 insertions(+), 6 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index d30582b9..1c13b12d 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -10,6 +10,7 @@ Most recent change on the bottom. 
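The new per-atom statistics tests pin down a simple contract: divide each per-graph quantity by that graph's atom count, then take the mean/std (or RMS) over graphs. A self-contained sketch of that contract with made-up numbers, not the dataset implementation:

    import torch

    # Made-up batch: four structures with different sizes and total energies.
    n_atoms = torch.tensor([[3.0], [5.0], [4.0], [6.0]])         # (n_graphs, 1)
    total_E = torch.tensor([[-9.3], [-15.4], [-12.1], [-18.8]])  # (n_graphs, 1)

    per_atom_E = total_E / n_atoms                # normalize each graph by its atom count
    mean = per_atom_E.mean(dim=0)                 # "per_atom_mean_std" -> mean over graphs
    std = per_atom_E.std(dim=0, unbiased=True)    #                       and std over graphs
    rms = per_atom_E.square().mean().sqrt()       # "per_atom_rms"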
## [Unreleased] - 0.5.3 ### Added - `nequip-evaluate --repeat` option +- Report number of weights to wandb ### Changed diff --git a/nequip/scripts/train.py b/nequip/scripts/train.py index f67f77b2..d716f6da 100644 --- a/nequip/scripts/train.py +++ b/nequip/scripts/train.py @@ -178,8 +178,13 @@ def fresh_start(config): final_model = model_from_config( config=config, initialize=True, dataset=trainer.dataset_train ) - logging.info("Successfully built the network...") + num_weights: int = sum(p.numel() for p in final_model.parameters()) + logging.info(f"Number of weights: {num_weights}") + # upload it to wandb + if config.wandb: + # we've already imported wandb in an earlier `if` + wandb.config.update({"num_weights": num_weights}) # by doing this here we check also any keys custom builders may have added _check_old_keys(config) diff --git a/nequip/train/trainer.py b/nequip/train/trainer.py index f7a9b3e4..25a5e7ed 100644 --- a/nequip/train/trainer.py +++ b/nequip/train/trainer.py @@ -741,11 +741,6 @@ def train(self): raise RuntimeError("You must call `set_dataset()` before calling `train()`") if not self._initialized: self.init() - self.logger.info( - "Number of weights: {}".format( - sum(p.numel() for p in self.model.parameters()) - ) - ) for callback in self._init_callbacks: callback(self) From 34db05d2c70c1dccd223f32e8dd354d982480c58 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Tue, 22 Feb 2022 15:21:52 -0500 Subject: [PATCH 46/53] move wandb logging to wanbd trainer --- nequip/scripts/train.py | 6 ------ nequip/train/trainer.py | 3 +++ nequip/train/trainer_wandb.py | 3 +++ 3 files changed, 6 insertions(+), 6 deletions(-) diff --git a/nequip/scripts/train.py b/nequip/scripts/train.py index d716f6da..a4304e5b 100644 --- a/nequip/scripts/train.py +++ b/nequip/scripts/train.py @@ -179,12 +179,6 @@ def fresh_start(config): config=config, initialize=True, dataset=trainer.dataset_train ) logging.info("Successfully built the network...") - num_weights: int = sum(p.numel() for p in final_model.parameters()) - logging.info(f"Number of weights: {num_weights}") - # upload it to wandb - if config.wandb: - # we've already imported wandb in an earlier `if` - wandb.config.update({"num_weights": num_weights}) # by doing this here we check also any keys custom builders may have added _check_old_keys(config) diff --git a/nequip/train/trainer.py b/nequip/train/trainer.py index 25a5e7ed..6257fbca 100644 --- a/nequip/train/trainer.py +++ b/nequip/train/trainer.py @@ -699,6 +699,9 @@ def init(self): self.model.to(self.torch_device) + self.num_weights = sum(p.numel() for p in self.model.parameters()) + self.logger.info(f"Number of weights: {self.num_weights}") + self.rescale_layers = [] outer_layer = self.model while hasattr(outer_layer, "unscale"): diff --git a/nequip/train/trainer_wandb.py b/nequip/train/trainer_wandb.py index deed5206..8bbcb1b9 100644 --- a/nequip/train/trainer_wandb.py +++ b/nequip/train/trainer_wandb.py @@ -16,6 +16,9 @@ def init(self): if not self._initialized: return + # upload some new fields to wandb + wandb.config.update({"num_weights": self.num_weights}) + if self.kwargs.get("wandb_watch", False): wandb_watch_kwargs = self.kwargs.get("wandb_watch_kwargs", {}) wandb.watch(self.model, **wandb_watch_kwargs) From 405cc19cebf8dff304c9171aa7b7d0d92fc3ea09 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Wed, 23 Feb 2022 13:15:52 -0500 Subject: [PATCH 47/53] set avg_num_neighbors=auto 
by default --- CHANGELOG.md | 2 +- nequip/model/builder_utils.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 1c13b12d..230fd730 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -13,11 +13,11 @@ Most recent change on the bottom. - Report number of weights to wandb ### Changed - - defaults and commments in example.yaml and full.yaml, in particular longer default training and correct comment for E:F-weighting - better metrics config in example.yaml and full.yaml, in particular will total F-MAE/F-RMSE instead of mean over per-species - default value for `report_init_validation` is now `True` - `all_*_*` metrics rename to -> `psavg_*_*` +- `avg_num_neighbors` default `None` -> `auto` ### Fixed - error if both per-species and global shift are used together diff --git a/nequip/model/builder_utils.py b/nequip/model/builder_utils.py index 5c0ec04a..1cbe411c 100644 --- a/nequip/model/builder_utils.py +++ b/nequip/model/builder_utils.py @@ -27,7 +27,7 @@ def add_avg_num_neighbors( ) -> Optional[float]: # Compute avg_num_neighbors annkey: str = "avg_num_neighbors" - ann = config.get(annkey, None) + ann = config.get(annkey, "auto") if ann == "auto": if not initialize: raise ValueError("avg_num_neighbors = auto but initialize is False") From c7c0af6b547c3719c4f795159f16a173f84a2b17 Mon Sep 17 00:00:00 2001 From: nw13slx Date: Wed, 23 Feb 2022 13:49:19 -0500 Subject: [PATCH 48/53] update test_dataset for asserts --- tests/unit/data/test_dataset.py | 31 +++++++++++++++++++------------ 1 file changed, 19 insertions(+), 12 deletions(-) diff --git a/tests/unit/data/test_dataset.py b/tests/unit/data/test_dataset.py index a05e963d..7f860431 100644 --- a/tests/unit/data/test_dataset.py +++ b/tests/unit/data/test_dataset.py @@ -207,18 +207,17 @@ def test_per_node_field(self, npz_dataset, mode): ) @pytest.mark.parametrize("fixed_field", [True, False]) - @pytest.mark.parametrize("full_rank", [True, False]) @pytest.mark.parametrize("subset", [True, False]) @pytest.mark.parametrize( "key,dim", [(AtomicDataDict.TOTAL_ENERGY_KEY, (1,)), ("somekey", (3,))] ) def test_per_graph_field( - self, npz_dataset, fixed_field, full_rank, subset, key, dim + self, npz_dataset, fixed_field, subset, key, dim ): if key == "somekey": register_fields(graph_fields=[key]) - npz_dataset = set_up_transformer(npz_dataset, full_rank, fixed_field, subset) + npz_dataset = set_up_transformer(npz_dataset, True, fixed_field, subset) if npz_dataset is None: return @@ -267,7 +266,7 @@ def test_per_node_field(self, npz_dataset, fixed_field, mode, subset): ) print(result) - @pytest.mark.parametrize("alpha", [1e-10, 1e-6, 0.1, 0.5, 1]) + @pytest.mark.parametrize("alpha", [1e-5, 1e-3, 0.1, 0.5]) @pytest.mark.parametrize("fixed_field", [True, False]) @pytest.mark.parametrize("full_rank", [True, False]) @pytest.mark.parametrize("subset", [True, False]) @@ -278,6 +277,9 @@ def test_per_graph_field( self, npz_dataset, alpha, fixed_field, full_rank, regressor, subset ): + if alpha <= 1e-4 and not full_rank: + return + npz_dataset = set_up_transformer(npz_dataset, full_rank, fixed_field, subset) if npz_dataset is None: return @@ -295,10 +297,10 @@ def test_per_graph_field( del n_spec del Ns - if alpha == 1e-10: - ref_mean, ref_std, E = generate_E(N, 100, 0.0) + if alpha == 1e-5: + ref_mean, ref_std, E = generate_E(N, 1000, 0.0) else: - ref_mean, ref_std, E = generate_E(N, 100, 0.5) + ref_mean, ref_std, E = generate_E(N, 1000, 0.5) if subset: E_orig_order = torch.zeros_like( @@ -333,11 +335,16 @@ def 
test_per_graph_field( print("diff in mean", mean - ref_mean) print("std", std, ref_std) - if alpha == 1e-10 and full_rank: - assert torch.allclose(mean, ref_mean, rtol=1e-1) - assert torch.allclose(std, torch.zeros_like(ref_mean), atol=1e-2) - # else: - # assert res2 > ref_res2 + if full_rank: + if alpha == 1e-5: + assert torch.allclose(mean, ref_mean, rtol=1e-1) + else: + assert torch.allclose(mean, ref_mean, rtol=8e-1) + assert torch.allclose(std, torch.zeros_like(ref_mean), atol=alpha*100) + elif regressor == "NormalizedGaussianProcess": + assert torch.std(mean).numpy() ==0 + else: + assert mean[0] == mean[1]*2 class TestReload: From 29804cfb17d1750744c6523e4dc4b6dfa62bc3a9 Mon Sep 17 00:00:00 2001 From: nw13slx Date: Wed, 23 Feb 2022 13:50:44 -0500 Subject: [PATCH 49/53] format --- tests/unit/data/test_dataset.py | 10 ++++------ 1 file changed, 4 insertions(+), 6 deletions(-) diff --git a/tests/unit/data/test_dataset.py b/tests/unit/data/test_dataset.py index 7f860431..b0af9049 100644 --- a/tests/unit/data/test_dataset.py +++ b/tests/unit/data/test_dataset.py @@ -211,9 +211,7 @@ def test_per_node_field(self, npz_dataset, mode): @pytest.mark.parametrize( "key,dim", [(AtomicDataDict.TOTAL_ENERGY_KEY, (1,)), ("somekey", (3,))] ) - def test_per_graph_field( - self, npz_dataset, fixed_field, subset, key, dim - ): + def test_per_graph_field(self, npz_dataset, fixed_field, subset, key, dim): if key == "somekey": register_fields(graph_fields=[key]) @@ -340,11 +338,11 @@ def test_per_graph_field( assert torch.allclose(mean, ref_mean, rtol=1e-1) else: assert torch.allclose(mean, ref_mean, rtol=8e-1) - assert torch.allclose(std, torch.zeros_like(ref_mean), atol=alpha*100) + assert torch.allclose(std, torch.zeros_like(ref_mean), atol=alpha * 100) elif regressor == "NormalizedGaussianProcess": - assert torch.std(mean).numpy() ==0 + assert torch.std(mean).numpy() == 0 else: - assert mean[0] == mean[1]*2 + assert mean[0] == mean[1] * 2 class TestReload: From 7a31f3287719d3a371d613e0ac12e91bc05c9912 Mon Sep 17 00:00:00 2001 From: nw13slx Date: Wed, 23 Feb 2022 14:17:23 -0500 Subject: [PATCH 50/53] loose the fitting criteria in unit test for python 3.6 --- tests/unit/data/test_dataset.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/unit/data/test_dataset.py b/tests/unit/data/test_dataset.py index b0af9049..f0a04832 100644 --- a/tests/unit/data/test_dataset.py +++ b/tests/unit/data/test_dataset.py @@ -337,7 +337,7 @@ def test_per_graph_field( if alpha == 1e-5: assert torch.allclose(mean, ref_mean, rtol=1e-1) else: - assert torch.allclose(mean, ref_mean, rtol=8e-1) + assert torch.allclose(mean, ref_mean, rtol=2) assert torch.allclose(std, torch.zeros_like(ref_mean), atol=alpha * 100) elif regressor == "NormalizedGaussianProcess": assert torch.std(mean).numpy() == 0 From 97c7059be9e232b4a8319fe553a70e06078df468 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Wed, 23 Feb 2022 14:45:36 -0500 Subject: [PATCH 51/53] mark release --- CHANGELOG.md | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 230fd730..df941fe3 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -7,7 +7,9 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 Most recent change on the bottom. 
-## [Unreleased] - 0.5.3 +## [Unreleased] + +## [0.5.3] - 2022-02-23 ### Added - `nequip-evaluate --repeat` option - Report number of weights to wandb From 929a4b79ac452264c38d0e956e1ab85d9072fde4 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Wed, 23 Feb 2022 15:31:46 -0500 Subject: [PATCH 52/53] sklearn version avoid bug --- setup.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/setup.py b/setup.py index bf46b7de..c9e931ae 100644 --- a/setup.py +++ b/setup.py @@ -37,7 +37,7 @@ "typing_extensions;python_version<'3.8'", # backport of Final "torch-runstats>=0.2.0", "torch-ema>=0.3.0", - "scikit_learn", # for GaussianProcess for per-species statistics + "scikit_learn==1.0.1", # for GaussianProcess for per-species statistics; 1.0.2 has a bug! ], zip_safe=True, ) From 203f1fcb84e4c128e9206f19604264c338b30d56 Mon Sep 17 00:00:00 2001 From: Linux-cpp-lisp <1473644+Linux-cpp-lisp@users.noreply.github.com> Date: Wed, 23 Feb 2022 15:35:17 -0500 Subject: [PATCH 53/53] version fix for old python --- setup.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/setup.py b/setup.py index c9e931ae..ad57b290 100644 --- a/setup.py +++ b/setup.py @@ -37,7 +37,7 @@ "typing_extensions;python_version<'3.8'", # backport of Final "torch-runstats>=0.2.0", "torch-ema>=0.3.0", - "scikit_learn==1.0.1", # for GaussianProcess for per-species statistics; 1.0.2 has a bug! + "scikit_learn<=1.0.1", # for GaussianProcess for per-species statistics; 1.0.2 has a bug! ], zip_safe=True, )
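
The weight-reporting changes earlier in this series boil down to one pattern: compute the parameter count once when the trainer initializes (`sum(p.numel() for p in self.model.parameters())`), log it, and mirror it into the wandb run config from the wandb trainer subclass. Below is a minimal standalone sketch of that pattern; the toy model, the `count_weights` helper, and the `use_wandb` flag are illustrative placeholders and not part of the nequip API.

    import torch


    def count_weights(model: torch.nn.Module) -> int:
        # Total number of scalar parameters, summed over all parameter tensors;
        # the same expression the trainer uses in the patches above.
        return sum(p.numel() for p in model.parameters())


    if __name__ == "__main__":
        # Toy stand-in for the built network.
        model = torch.nn.Sequential(
            torch.nn.Linear(16, 64),
            torch.nn.SiLU(),
            torch.nn.Linear(64, 1),
        )
        num_weights = count_weights(model)
        print(f"Number of weights: {num_weights}")

        use_wandb = False  # placeholder flag for this sketch
        if use_wandb:
            import wandb

            # Mirror the count into the run config, analogous to
            # wandb.config.update({"num_weights": self.num_weights}) in trainer_wandb.py.
            wandb.config.update({"num_weights": num_weights})

If the wandb branch is enabled, the sketch assumes `wandb.init()` has already been called before `wandb.config.update` is used.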