From 287d8606099b69e77f58ac967dc8e89b2ef9aaa2 Mon Sep 17 00:00:00 2001
From: jrudz <rudzinski@mpip-mainz.mpg.de>
Date: Thu, 4 Jan 2024 11:39:50 +0100
Subject: [PATCH] added default assignment of unknown atom labels

---
 atomisticparsers/lammps/parser.py | 1358 +++++++++++++++++++----------
 1 file changed, 910 insertions(+), 448 deletions(-)

diff --git a/atomisticparsers/lammps/parser.py b/atomisticparsers/lammps/parser.py
index ad47346f..91f75353 100644
--- a/atomisticparsers/lammps/parser.py
+++ b/atomisticparsers/lammps/parser.py
@@ -26,77 +26,157 @@
 from nomad.parsing.file_parser import Quantity, TextParser
 from nomad.datamodel.metainfo.simulation.run import Run, Program
 from nomad.datamodel.metainfo.simulation.method import (
-    NeighborSearching, ForceCalculations, ForceField, Method, Model, AtomParameters
-)
-from nomad.datamodel.metainfo.simulation.system import (
-    AtomsGroup
+    NeighborSearching,
+    ForceCalculations,
+    ForceField,
+    Method,
+    Model,
+    AtomParameters,
 )
+from nomad.datamodel.metainfo.simulation.system import AtomsGroup
 from simulationworkflowschema import (
-    GeometryOptimization, GeometryOptimizationMethod, GeometryOptimizationResults
+    GeometryOptimization,
+    GeometryOptimizationMethod,
+    GeometryOptimizationResults,
+)
+from .metainfo.lammps import (
+    x_lammps_section_input_output_files,
+    x_lammps_section_control_parameters,
 )
-from .metainfo.lammps import x_lammps_section_input_output_files, x_lammps_section_control_parameters
 from atomisticparsers.utils import MDAnalysisParser, MDParser
 from nomad.atomutils import get_bond_list_from_model_contributions
 
 
-re_float = r'[-+]?\d+\.*\d*(?:[Ee][-+]\d+)?'
-re_n = r'[\n\r]'
+re_float = r"[-+]?\d+\.*\d*(?:[Ee][-+]\d+)?"
+re_n = r"[\n\r]"
 
 
 def get_unit(units_type, property_type=None, dimension=3):
-    mole = 6.022140857e+23
+    mole = 6.022140857e23
 
     units_type = units_type.lower()
-    if units_type == 'real':
+    if units_type == "real":
         units = dict(
-            mass=ureg.g / mole, distance=ureg.angstrom, time=ureg.fs,
-            energy=ureg.J * 4184.0 / mole, velocity=ureg.angstrom / ureg.fs,
-            force=ureg.J * 4184.0 / ureg.angstrom / mole, torque=ureg.J * 4184.0 / mole,
-            temperature=ureg.K, pressure=ureg.atm, dynamic_viscosity=ureg.poise, charge=ureg.elementary_charge,
-            dipole=ureg.elementary_charge * ureg.angstrom, electric_field=ureg.V / ureg.angstrom,
-            density=ureg.g / ureg.cm ** dimension)
-
-    elif units_type == 'metal':
+            mass=ureg.g / mole,
+            distance=ureg.angstrom,
+            time=ureg.fs,
+            energy=ureg.J * 4184.0 / mole,
+            velocity=ureg.angstrom / ureg.fs,
+            force=ureg.J * 4184.0 / ureg.angstrom / mole,
+            torque=ureg.J * 4184.0 / mole,
+            temperature=ureg.K,
+            pressure=ureg.atm,
+            dynamic_viscosity=ureg.poise,
+            charge=ureg.elementary_charge,
+            dipole=ureg.elementary_charge * ureg.angstrom,
+            electric_field=ureg.V / ureg.angstrom,
+            density=ureg.g / ureg.cm**dimension,
+        )
+
+    elif units_type == "metal":
         units = dict(
-            mass=ureg.g / mole, distance=ureg.angstrom, time=ureg.ps,
-            energy=ureg.eV, velocity=ureg.angstrom / ureg.ps, force=ureg.eV / ureg.angstrom, torque=ureg.eV,
-            temperature=ureg.K, pressure=ureg.bar, dynamic_viscosity=ureg.poise, charge=ureg.elementary_charge,
-            dipole=ureg.elementary_charge * ureg.angstrom, electric_field=ureg.V / ureg.angstrom,
-            density=ureg.g / ureg.cm ** dimension)
+            mass=ureg.g / mole,
+            distance=ureg.angstrom,
+            time=ureg.ps,
+            energy=ureg.eV,
+            velocity=ureg.angstrom / ureg.ps,
+            force=ureg.eV / ureg.angstrom,
+            torque=ureg.eV,
+            temperature=ureg.K,
+            pressure=ureg.bar,
+            dynamic_viscosity=ureg.poise,
+            charge=ureg.elementary_charge,
+            dipole=ureg.elementary_charge * ureg.angstrom,
+            electric_field=ureg.V / ureg.angstrom,
+            density=ureg.g / ureg.cm**dimension,
+        )
 
-    elif units_type == 'si':
+    elif units_type == "si":
         units = dict(
-            mass=ureg.kg, distance=ureg.m, time=ureg.s, energy=ureg.J, velocity=ureg.m / ureg.s, force=ureg.N,
-            torque=ureg.N * ureg.m, temperature=ureg.K, pressure=ureg.Pa, dynamic_viscosity=ureg.Pa * ureg.s,
-            charge=ureg.C, dipole=ureg.C * ureg.m, electric_field=ureg.V / ureg.m, density=ureg.kg / ureg.m ** dimension)
+            mass=ureg.kg,
+            distance=ureg.m,
+            time=ureg.s,
+            energy=ureg.J,
+            velocity=ureg.m / ureg.s,
+            force=ureg.N,
+            torque=ureg.N * ureg.m,
+            temperature=ureg.K,
+            pressure=ureg.Pa,
+            dynamic_viscosity=ureg.Pa * ureg.s,
+            charge=ureg.C,
+            dipole=ureg.C * ureg.m,
+            electric_field=ureg.V / ureg.m,
+            density=ureg.kg / ureg.m**dimension,
+        )
 
-    elif units_type == 'cgs':
+    elif units_type == "cgs":
         units = dict(
-            mass=ureg.g, distance=ureg.cm, time=ureg.s, energy=ureg.erg, velocity=ureg.cm / ureg.s, force=ureg.dyne,
-            torque=ureg.dyne * ureg.cm, temperature=ureg.K, pressure=ureg.dyne / ureg. cm ** 2, dynamic_viscosity=ureg.poise,
-            charge=ureg.esu, dipole=ureg.esu * ureg.cm, electric_field=ureg.dyne / ureg.esu,
-            density=ureg.g / ureg.cm ** dimension)
+            mass=ureg.g,
+            distance=ureg.cm,
+            time=ureg.s,
+            energy=ureg.erg,
+            velocity=ureg.cm / ureg.s,
+            force=ureg.dyne,
+            torque=ureg.dyne * ureg.cm,
+            temperature=ureg.K,
+            pressure=ureg.dyne / ureg.cm**2,
+            dynamic_viscosity=ureg.poise,
+            charge=ureg.esu,
+            dipole=ureg.esu * ureg.cm,
+            electric_field=ureg.dyne / ureg.esu,
+            density=ureg.g / ureg.cm**dimension,
+        )
 
-    elif units_type == 'electron':
+    elif units_type == "electron":
         units = dict(
-            mass=ureg.amu, distance=ureg.bohr, time=ureg.fs, energy=ureg.hartree,
-            velocity=ureg.bohr / ureg.atomic_unit_of_time, force=ureg.hartree / ureg.bohr, temperature=ureg.K,
-            pressure=ureg.Pa, charge=ureg.elementary_charge, dipole=ureg.debye, electric_field=ureg.V / ureg.cm)
+            mass=ureg.amu,
+            distance=ureg.bohr,
+            time=ureg.fs,
+            energy=ureg.hartree,
+            velocity=ureg.bohr / ureg.atomic_unit_of_time,
+            force=ureg.hartree / ureg.bohr,
+            temperature=ureg.K,
+            pressure=ureg.Pa,
+            charge=ureg.elementary_charge,
+            dipole=ureg.debye,
+            electric_field=ureg.V / ureg.cm,
+        )
 
-    elif units_type == 'micro':
+    elif units_type == "micro":
         units = dict(
-            mass=ureg.pg, distance=ureg.microm, time=ureg.micros, energy=ureg.pg * ureg.microm ** 2 / ureg.micros ** 2,
-            velocity=ureg.microm / ureg.micros, force=ureg.pg * ureg.microm / ureg.micros ** 2, torque=ureg.pg * ureg.microm ** 2 / ureg.micros ** 2,
-            temperature=ureg.K, pressure=ureg.pg / (ureg.microm * ureg.micros ** 2), dynamic_viscosity=ureg.pg / (ureg.microm * ureg.micros),
-            charge=ureg.pC, dipole=ureg.pC * ureg.microm, electric_field=ureg.V / ureg.microm,
-            density=ureg.pg / ureg.microm ** dimension)
+            mass=ureg.pg,
+            distance=ureg.microm,
+            time=ureg.micros,
+            energy=ureg.pg * ureg.microm**2 / ureg.micros**2,
+            velocity=ureg.microm / ureg.micros,
+            force=ureg.pg * ureg.microm / ureg.micros**2,
+            torque=ureg.pg * ureg.microm**2 / ureg.micros**2,
+            temperature=ureg.K,
+            pressure=ureg.pg / (ureg.microm * ureg.micros**2),
+            dynamic_viscosity=ureg.pg / (ureg.microm * ureg.micros),
+            charge=ureg.pC,
+            dipole=ureg.pC * ureg.microm,
+            electric_field=ureg.V / ureg.microm,
+            density=ureg.pg / ureg.microm**dimension,
+        )
 
-    elif units_type == 'nano':
+    elif units_type == "nano":
         units = dict(
-            mass=ureg.ag, distance=ureg.nm, time=ureg.ns, energy=ureg.ag * ureg.nm ** 2 / ureg.ns ** 2, velocity=ureg.nm / ureg.ns,
-            force=ureg.ag * ureg.nm / ureg.ns ** 2, torque=ureg.ag * ureg.nm ** 2 / ureg.ns ** 2, temperature=ureg.K, pressure=ureg.ag / (ureg.nm * ureg.ns ** 2),
-            dynamic_viscosity=ureg.ag / (ureg.nm * ureg.ns), charge=ureg.elementary_charge,
-            dipole=ureg.elementary_charge * ureg.nm, electric_field=ureg.V / ureg.nm, density=ureg.ag / ureg.nm ** dimension)
+            mass=ureg.ag,
+            distance=ureg.nm,
+            time=ureg.ns,
+            energy=ureg.ag * ureg.nm**2 / ureg.ns**2,
+            velocity=ureg.nm / ureg.ns,
+            force=ureg.ag * ureg.nm / ureg.ns**2,
+            torque=ureg.ag * ureg.nm**2 / ureg.ns**2,
+            temperature=ureg.K,
+            pressure=ureg.ag / (ureg.nm * ureg.ns**2),
+            dynamic_viscosity=ureg.ag / (ureg.nm * ureg.ns),
+            charge=ureg.elementary_charge,
+            dipole=ureg.elementary_charge * ureg.nm,
+            electric_field=ureg.V / ureg.nm,
+            density=ureg.ag / ureg.nm**dimension,
+        )
 
     else:
         # units = dict(
@@ -114,39 +194,80 @@ def get_unit(units_type, property_type=None, dimension=3):
 class DataParser(TextParser):
     def __init__(self):
         self._headers = [
-            'atoms', 'bonds', 'angles', 'dihedrals', 'impropers', 'atom types', 'bond types',
-            'angle types', 'dihedral types', 'improper types', 'extra bond per atom',
-            'extra/bond/per/atom', 'extra angle per atom', 'extra/angle/per/atom',
-            'extra dihedral per atom', 'extra/dihedral/per/atom', 'extra improper per atom',
-            'extra/improper/per/atom', 'extra special per atom', 'extra/special/per/atom',
-            'ellipsoids', 'lines', 'triangles', 'bodies']
+            "atoms",
+            "bonds",
+            "angles",
+            "dihedrals",
+            "impropers",
+            "atom types",
+            "bond types",
+            "angle types",
+            "dihedral types",
+            "improper types",
+            "extra bond per atom",
+            "extra/bond/per/atom",
+            "extra angle per atom",
+            "extra/angle/per/atom",
+            "extra dihedral per atom",
+            "extra/dihedral/per/atom",
+            "extra improper per atom",
+            "extra/improper/per/atom",
+            "extra special per atom",
+            "extra/special/per/atom",
+            "ellipsoids",
+            "lines",
+            "triangles",
+            "bodies",
+        ]
         self._sections = [
-            'Atoms', 'Velocities', 'Masses', 'Ellipsoids', 'Lines', 'Triangles', 'Bodies',
-            'Bonds', 'Angles', 'Dihedrals', 'Impropers', 'Pair Coeffs', 'PairIJ Coeffs',
-            'Bond Coeffs', 'Angle Coeffs', 'Dihedral Coeffs', 'Improper Coeffs',
-            'BondBond Coeffs', 'BondAngle Coeffs', 'MiddleBondTorsion Coeffs',
-            'EndBondTorsion Coeffs', 'AngleTorsion Coeffs', 'AngleAngleTorsion Coeffs',
-            'BondBond13 Coeffs', 'AngleAngle Coeffs']
+            "Atoms",
+            "Velocities",
+            "Masses",
+            "Ellipsoids",
+            "Lines",
+            "Triangles",
+            "Bodies",
+            "Bonds",
+            "Angles",
+            "Dihedrals",
+            "Impropers",
+            "Pair Coeffs",
+            "PairIJ Coeffs",
+            "Bond Coeffs",
+            "Angle Coeffs",
+            "Dihedral Coeffs",
+            "Improper Coeffs",
+            "BondBond Coeffs",
+            "BondAngle Coeffs",
+            "MiddleBondTorsion Coeffs",
+            "EndBondTorsion Coeffs",
+            "AngleTorsion Coeffs",
+            "AngleAngleTorsion Coeffs",
+            "BondBond13 Coeffs",
+            "AngleAngle Coeffs",
+        ]
         self._interactions = [
-            section for section in self._sections if section.endswith('Coeffs')]
+            section for section in self._sections if section.endswith("Coeffs")
+        ]
         super().__init__(None)
 
     def init_quantities(self):
-        self._quantities = [Quantity(
-            header, rf'{re_n} *(\d+) +{header}', repeats=True, dtype=np.int32
-        ) for header in self._headers]
+        self._quantities = [
+            Quantity(header, rf"{re_n} *(\d+) +{header}", repeats=True, dtype=np.int32)
+            for header in self._headers
+        ]
 
         def get_section_value(val):
             val = val.strip().splitlines()
             name = None
 
-            if val[0][0] == '#':
+            if val[0][0] == "#":
                 name = val[0][1:].strip()
                 val = val[1:]
 
             value = []
             for i in range(len(val)):
-                v = val[i].split('#')[0].split()
+                v = val[i].split("#")[0].split()
                 if not v:
                     continue
 
@@ -157,9 +278,17 @@ def get_section_value(val):
 
             return name, np.array(value)
 
-        self._quantities.extend([Quantity(
-            section, rf'{section} *(#*.*{re_n}\s+(?:[\d ]+{re_float}.+\s+)+)',
-            str_operation=get_section_value, repeats=True) for section in self._sections])
+        self._quantities.extend(
+            [
+                Quantity(
+                    section,
+                    rf"{section} *(#*.*{re_n}\s+(?:[\d ]+{re_float}.+\s+)+)",
+                    str_operation=get_section_value,
+                    repeats=True,
+                )
+                for section in self._sections
+            ]
+        )
 
     def get_interactions(self):
         styles_coeffs = []
@@ -179,16 +308,16 @@ class TrajParser(TextParser):
     def __init__(self):
         self._masses = None
         self._reference_masses = dict(
-            masses=np.array(asedata.atomic_masses), symbols=asedata.chemical_symbols)
+            masses=np.array(asedata.atomic_masses), symbols=asedata.chemical_symbols
+        )
         self._chemical_symbols = None
         super().__init__(None)
 
     def init_quantities(self):
-
         def get_pbc_cell(val):
             val = val.split()
 
-            pbc = [v == 'pp' for v in val[:3]]
+            pbc = [v == "pp" for v in val[:3]]
 
             cell = np.zeros((3, 3))
             for i in range(3):
@@ -197,7 +326,7 @@ def get_pbc_cell(val):
             return pbc, cell
 
         def get_atoms_info(val):
-            val = val.split('\n')
+            val = val.split("\n")
             keys = val[0].split()
             values = np.array([v.split() for v in val[1:] if v], dtype=float)
             values = values[values[:, 0].argsort()].T
@@ -205,26 +334,40 @@ def get_atoms_info(val):
 
         self._quantities = [
             Quantity(
-                'time_step', r'\s*ITEM:\s*TIMESTEP\s*\n\s*(\d+)\s*\n', comment='#',
-                repeats=True),
+                "time_step",
+                r"\s*ITEM:\s*TIMESTEP\s*\n\s*(\d+)\s*\n",
+                comment="#",
+                repeats=True,
+            ),
             Quantity(
-                'n_atoms', r'\s*ITEM:\s*NUMBER OF ATOMS\s*\n\s*(\d+)\s*\n', comment='#',
-                repeats=True),
+                "n_atoms",
+                r"\s*ITEM:\s*NUMBER OF ATOMS\s*\n\s*(\d+)\s*\n",
+                comment="#",
+                repeats=True,
+            ),
             Quantity(
-                'pbc_cell', r'\s*ITEM: BOX BOUNDS\s*([\s\w]+)\n([\+\-\d\.eE\s]+)\n',
-                str_operation=get_pbc_cell, comment='#', repeats=True),
+                "pbc_cell",
+                r"\s*ITEM: BOX BOUNDS\s*([\s\w]+)\n([\+\-\d\.eE\s]+)\n",
+                str_operation=get_pbc_cell,
+                comment="#",
+                repeats=True,
+            ),
             Quantity(
-                'atoms_info', r'\s*ITEM:\s*ATOMS\s*([ \w]+\n)*?([\+\-eE\d\.\n ]+)',
-                str_operation=get_atoms_info, comment='#', repeats=True)
+                "atoms_info",
+                r"\s*ITEM:\s*ATOMS\s*([ \w]+\n)*?([\+\-eE\d\.\n ]+)",
+                str_operation=get_atoms_info,
+                comment="#",
+                repeats=True,
+            ),
         ]
 
     @property
     def with_trajectory(self):
-        return self.get('atoms_info') is not None
+        return self.get("atoms_info") is not None
 
     @property
     def n_frames(self):
-        return len(self.get('atoms_info', []))
+        return len(self.get("atoms_info", []))
 
     @property
     def masses(self):
@@ -241,60 +384,72 @@ def masses(self, val):
             masses = self._masses[0][1]
             self._chemical_symbols = {}
             for i in range(len(masses)):
-                symbol_idx = np.argmin(abs(self._reference_masses['masses'] - masses[i][1]))
-                self._chemical_symbols[masses[i][0]] = self._reference_masses['symbols'][symbol_idx]
+                symbol_idx = np.argmin(
+                    abs(self._reference_masses["masses"] - masses[i][1])
+                )
+                self._chemical_symbols[masses[i][0]] = self._reference_masses[
+                    "symbols"
+                ][symbol_idx]
 
     def get_atom_labels(self, idx):
-        atoms_info = self.get('atoms_info')
+        atoms_info = self.get("atoms_info")
         if atoms_info is None:
             return
 
-        atoms_type = atoms_info[idx].get('type')
+        atoms_id = atoms_info[idx].get("id")
+        default = ["X" for _ in atoms_id] if atoms_id is not None else None
+        atoms_type = atoms_info[idx].get("type")
         if atoms_type is None:
-            return
-
+            return default
         if self._chemical_symbols is None:
-            return
+            return default
 
         try:
             atom_labels = [self._chemical_symbols[atype] for atype in atoms_type]
         except Exception:
-            self.logger.error('Error resolving atom labels.')
+            self.logger.error("Error resolving atom labels.")
             return
 
         return atom_labels
 
     def get_positions(self, idx):
-        atoms_info = self.get('atoms_info')
+        atoms_info = self.get("atoms_info")
         if atoms_info is None:
             return
 
         atoms_info = atoms_info[idx]
 
-        cell = self.get('pbc_cell')
+        cell = self.get("pbc_cell")
         cell = None if cell is None else cell[idx][1]
-        if 'xs' in atoms_info and 'ys' in atoms_info and 'zs' in atoms_info:
+        if "xs" in atoms_info and "ys" in atoms_info and "zs" in atoms_info:
             if cell is None:
                 return
-            positions = np.array([atoms_info['xs'], atoms_info['ys'], atoms_info['zs']]).T
+            positions = np.array(
+                [atoms_info["xs"], atoms_info["ys"], atoms_info["zs"]]
+            ).T
             positions = positions * np.linalg.norm(cell, axis=1) + np.amin(cell, axis=1)
 
-        elif 'xu' in atoms_info and 'yu' in atoms_info and 'zu' in atoms_info:
-            positions = np.array([atoms_info['xu'], atoms_info['yu'], atoms_info['zu']]).T
+        elif "xu" in atoms_info and "yu" in atoms_info and "zu" in atoms_info:
+            positions = np.array(
+                [atoms_info["xu"], atoms_info["yu"], atoms_info["zu"]]
+            ).T
 
-        elif 'xsu' in atoms_info and 'ysu' in atoms_info and 'zsu' in atoms_info:
+        elif "xsu" in atoms_info and "ysu" in atoms_info and "zsu" in atoms_info:
             if cell is None:
                 return
-            positions = np.array([atoms_info['xsu'], atoms_info['ysu'], atoms_info['zsu']]).T
+            positions = np.array(
+                [atoms_info["xsu"], atoms_info["ysu"], atoms_info["zsu"]]
+            ).T
             positions = positions * np.linalg.norm(cell, axis=1) + np.amin(cell, axis=1)
 
-        elif 'x' in atoms_info and 'y' in atoms_info and 'z' in atoms_info:
-            positions = np.array([atoms_info['x'], atoms_info['y'], atoms_info['z']]).T
-            if 'ix' in atoms_info and 'iy' in atoms_info and 'iz' in atoms_info:
+        elif "x" in atoms_info and "y" in atoms_info and "z" in atoms_info:
+            positions = np.array([atoms_info["x"], atoms_info["y"], atoms_info["z"]]).T
+            if "ix" in atoms_info and "iy" in atoms_info and "iz" in atoms_info:
                 if cell is None:
                     return
-                positions_img = np.array([
-                    atoms_info['ix'], atoms_info['iy'], atoms_info['iz']]).T
+                positions_img = np.array(
+                    [atoms_info["ix"], atoms_info["iy"], atoms_info["iz"]]
+                ).T
 
                 positions += positions_img * np.linalg.norm(cell, axis=1)
         else:
@@ -303,44 +458,44 @@ def get_positions(self, idx):
         return positions
 
     def get_velocities(self, idx):
-        atoms_info = self.get('atoms_info')
+        atoms_info = self.get("atoms_info")
         if atoms_info is None:
             return
         atoms_info = atoms_info[idx]
-        if 'vx' not in atoms_info or 'vy' not in atoms_info or 'vz' not in atoms_info:
+        if "vx" not in atoms_info or "vy" not in atoms_info or "vz" not in atoms_info:
             return
 
-        return np.array([atoms_info['vx'], atoms_info['vy'], atoms_info['vz']]).T
+        return np.array([atoms_info["vx"], atoms_info["vy"], atoms_info["vz"]]).T
 
     def get_forces(self, idx):
-        atoms_info = self.get('atoms_info')
+        atoms_info = self.get("atoms_info")
         if atoms_info is None:
             return
         atoms_info = atoms_info[idx]
-        if 'fx' not in atoms_info or 'fy' not in atoms_info or 'fz' not in atoms_info:
+        if "fx" not in atoms_info or "fy" not in atoms_info or "fz" not in atoms_info:
             return
-        return np.array([atoms_info['fx'], atoms_info['fy'], atoms_info['fz']]).T
+        return np.array([atoms_info["fx"], atoms_info["fy"], atoms_info["fz"]]).T
 
     def get_lattice_vectors(self, idx):
-        pbc_cell = self.get('pbc_cell')
+        pbc_cell = self.get("pbc_cell")
         if pbc_cell is None:
             return
         return pbc_cell[idx][1]
 
     def get_pbc(self, idx):
-        pbc_cell = self.get('pbc_cell')
+        pbc_cell = self.get("pbc_cell")
         if pbc_cell is None:
             return
         return pbc_cell[idx][0]
 
     def get_n_atoms(self, idx):
-        n_atoms = self.get('n_atoms')
+        n_atoms = self.get("n_atoms")
         if n_atoms is None:
             return len(self.get_positions(idx))
         return n_atoms[idx]
 
     def get_step(self, idx):
-        step = self.get('time_step')
+        step = self.get("time_step")
         if step is None:
             return
         return step[idx]
@@ -351,9 +506,8 @@ def __init__(self):
         super().__init__()
 
     def init_quantities(self):
-
         def get_atoms_info(val_in):
-            val = [v.split('#')[0].split() for v in val_in.strip().split('\n')]
+            val = [v.split("#")[0].split() for v in val_in.strip().split("\n")]
             symbols = []
             for v in val:
                 if v[0].isalpha():
@@ -367,67 +521,186 @@ def get_atoms_info(val_in):
 
         self.quantities = [
             Quantity(
-                'atoms_info', r'((?:\d+|[A-Z][a-z]?) [\s\S]+?)(?:\s\d+\n|\Z)',
-                str_operation=get_atoms_info, comment='#', repeats=True)
+                "atoms_info",
+                r"((?:\d+|[A-Z][a-z]?) [\s\S]+?)(?:\s\d+\n|\Z)",
+                str_operation=get_atoms_info,
+                comment="#",
+                repeats=True,
+            )
         ]
 
 
 class LogParser(TextParser):
     def __init__(self):
         self._commands = [
-            'angle_coeff', 'angle_style', 'atom_modify', 'atom_style', 'balance',
-            'bond_coeff', 'bond_style', 'bond_write', 'boundary', 'change_box', 'clear',
-            'comm_modify', 'comm_style', 'compute', 'compute_modify', 'create_atoms',
-            'create_bonds', 'create_box', 'delete_bonds', 'dielectric', 'dihedral_coeff',
-            'dihedral_style', 'dimension', 'displace_atoms', 'dump', 'dump_modify',
-            'dynamical_matrix', 'echo', 'fix', 'fix_modify', 'group', 'group2ndx',
-            'ndx2group', 'hyper', 'if', 'improper_coeff', 'improper_style', 'include',
-            'info', 'jump', 'kim_init', 'kim_interactions', 'kim_query', 'kim_param',
-            'kim_property', 'kspace_modify', 'kspace_style', 'label', 'lattice', 'log',
-            'mass', 'message', 'min_modify', 'min_style', 'minimize', 'minimize/kk',
-            'molecule', 'neb', 'neb/spin', 'neigh_modify', 'neighbor', 'newton', 'next',
-            'package', 'pair_coeff', 'pair_modify', 'pair_style', 'pair_write',
-            'partition', 'prd', 'print', 'processors', 'quit', 'read_data', 'read_dump',
-            'read_restart', 'region', 'replicate', 'rerun', 'reset_atom_ids',
-            'reset_mol_ids', 'reset_timestep', 'restart', 'run', 'run_style', 'server',
-            'set', 'shell', 'special_bonds', 'suffix', 'tad', 'temper/grem', 'temper/npt',
-            'thermo', 'thermo_modify', 'thermo_style', 'third_order', 'timer', 'timestep',
-            'uncompute', 'undump', 'unfix', 'units', 'variable', 'velocity', 'write_coeff',
-            'write_data', 'write_dump', 'write_restart']
+            "angle_coeff",
+            "angle_style",
+            "atom_modify",
+            "atom_style",
+            "balance",
+            "bond_coeff",
+            "bond_style",
+            "bond_write",
+            "boundary",
+            "change_box",
+            "clear",
+            "comm_modify",
+            "comm_style",
+            "compute",
+            "compute_modify",
+            "create_atoms",
+            "create_bonds",
+            "create_box",
+            "delete_bonds",
+            "dielectric",
+            "dihedral_coeff",
+            "dihedral_style",
+            "dimension",
+            "displace_atoms",
+            "dump",
+            "dump_modify",
+            "dynamical_matrix",
+            "echo",
+            "fix",
+            "fix_modify",
+            "group",
+            "group2ndx",
+            "ndx2group",
+            "hyper",
+            "if",
+            "improper_coeff",
+            "improper_style",
+            "include",
+            "info",
+            "jump",
+            "kim_init",
+            "kim_interactions",
+            "kim_query",
+            "kim_param",
+            "kim_property",
+            "kspace_modify",
+            "kspace_style",
+            "label",
+            "lattice",
+            "log",
+            "mass",
+            "message",
+            "min_modify",
+            "min_style",
+            "minimize",
+            "minimize/kk",
+            "molecule",
+            "neb",
+            "neb/spin",
+            "neigh_modify",
+            "neighbor",
+            "newton",
+            "next",
+            "package",
+            "pair_coeff",
+            "pair_modify",
+            "pair_style",
+            "pair_write",
+            "partition",
+            "prd",
+            "print",
+            "processors",
+            "quit",
+            "read_data",
+            "read_dump",
+            "read_restart",
+            "region",
+            "replicate",
+            "rerun",
+            "reset_atom_ids",
+            "reset_mol_ids",
+            "reset_timestep",
+            "restart",
+            "run",
+            "run_style",
+            "server",
+            "set",
+            "shell",
+            "special_bonds",
+            "suffix",
+            "tad",
+            "temper/grem",
+            "temper/npt",
+            "thermo",
+            "thermo_modify",
+            "thermo_style",
+            "third_order",
+            "timer",
+            "timestep",
+            "uncompute",
+            "undump",
+            "unfix",
+            "units",
+            "variable",
+            "velocity",
+            "write_coeff",
+            "write_data",
+            "write_dump",
+            "write_restart",
+        ]
         self._interactions = [
-            'atom', 'pair', 'bond', 'angle', 'dihedral', 'improper', 'kspace']
+            "atom",
+            "pair",
+            "bond",
+            "angle",
+            "dihedral",
+            "improper",
+            "kspace",
+        ]
         self._units = None
         super().__init__(None)
 
     def init_quantities(self):
         def str_op(val):
-            val = val.split('#')[0]
-            val = val.replace('&\n', ' ').split()
+            val = val.split("#")[0]
+            val = val.replace("&\n", " ").split()
             val = val if len(val) > 1 else val[0]
             return val
 
         self._quantities = [
             Quantity(
-                name, r'\n\s*%s\s+([\w\. \/\#\-]+)(\&\n[\w\. \/\#\-]*)*' % name,
-                str_operation=str_op, comment='#', repeats=True) for name in self._commands]
+                name,
+                r"\n\s*%s\s+([\w\. \/\#\-]+)(\&\n[\w\. \/\#\-]*)*" % name,
+                str_operation=str_op,
+                comment="#",
+                repeats=True,
+            )
+            for name in self._commands
+        ]
 
-        self._quantities.append(Quantity(
-            'program_version', r'\s*LAMMPS\s*\(([\w ]+)\)\n', dtype=str, repeats=False,
-            flatten=False)
+        self._quantities.append(
+            Quantity(
+                "program_version",
+                r"\s*LAMMPS\s*\(([\w ]+)\)\n",
+                dtype=str,
+                repeats=False,
+                flatten=False,
+            )
         )
 
-        self._quantities.append(Quantity(
-            'finished', r'\s*Dangerous builds\s*=\s*(\d+)', repeats=False)
+        self._quantities.append(
+            Quantity("finished", r"\s*Dangerous builds\s*=\s*(\d+)", repeats=False)
         )
 
-        self._quantities.append(Quantity(
-            'minimization_stats', r'\s*Minimization stats:\s*([\s\S]+?)\n\n', flatten=False)
+        self._quantities.append(
+            Quantity(
+                "minimization_stats",
+                r"\s*Minimization stats:\s*([\s\S]+?)\n\n",
+                flatten=False,
+            )
         )
 
         def str_to_thermo(val):
             res = {}
-            if val.count('Step') > 1:
-                val = val.replace('--', '').replace('=', '').replace('(sec)', '').split()
+            if val.count("Step") > 1:
+                val = (
+                    val.replace("--", "").replace("=", "").replace("(sec)", "").split()
+                )
                 val = [v.strip() for v in val]
 
                 for i in range(len(val)):
@@ -436,7 +709,7 @@ def str_to_thermo(val):
                         res[val[i]].append(float(val[i + 1]))
 
             else:
-                val = val.split('\n')
+                val = val.split("\n")
                 keys = [v.strip() for v in val[0].split()]
                 val = np.array([v.split() for v in val[1:] if v], dtype=float).T
 
@@ -446,20 +719,25 @@ def str_to_thermo(val):
 
             return res
 
-        self._quantities.append(Quantity(
-            'thermo_data', r'\s*\-*(\s*Step\s*[\-\s\w\.\=\(\)]*[ \-\.\d\n]+)Loop',
-            str_operation=str_to_thermo, repeats=False, convert=False)
+        self._quantities.append(
+            Quantity(
+                "thermo_data",
+                r"\s*\-*(\s*Step\s*[\-\s\w\.\=\(\)]*[ \-\.\d\n]+)Loop",
+                str_operation=str_to_thermo,
+                repeats=False,
+                convert=False,
+            )
         )
 
     @property
     def units(self):
         if self._units is None:
-            units_type = self.get('units', ['lj'])[0]
+            units_type = self.get("units", ["lj"])[0]
             self._units = get_unit(units_type)
         return self._units
 
     def get_thermodynamic_data(self):
-        thermo_data = self.get('thermo_data')
+        thermo_data = self.get("thermo_data")
 
         if thermo_data is None:
             return
@@ -467,45 +745,57 @@ def get_thermodynamic_data(self):
         data = {}
         for key, val in thermo_data.items():
             low_key = key.lower()
-            if low_key.startswith('e_') or low_key.endswith('eng'):
-                data[key] = val * self.units.get('energy', 1)
-            elif low_key == 'press':
-                data[key] = val * self.units.get('pressure', 1)
-            elif low_key == 'temp':
-                data[key] = val * self.units.get('temperature', 1)
+            if low_key.startswith("e_") or low_key.endswith("eng"):
+                data[key] = val * self.units.get("energy", 1)
+            elif low_key == "press":
+                data[key] = val * self.units.get("pressure", 1)
+            elif low_key == "temp":
+                data[key] = val * self.units.get("temperature", 1)
             else:
                 data[key] = val
         return data
 
     def get_traj_files(self):
-        dump = self.get('dump')
+        dump = self.get("dump")
         if dump is None:
-            self.logger.warning('Trajectory not specified in directory, will scan.')
+            self.logger.warning("Trajectory not specified in directory, will scan.")
             # TODO improve matching of traj file
             traj_files = os.listdir(self.maindir)
-            traj_files = [f for f in traj_files if f.endswith('trj') or f.endswith('xyz')]
+            traj_files = [
+                f for f in traj_files if f.endswith("trj") or f.endswith("xyz")
+            ]
             # further eliminate
             if len(traj_files) > 1:
-                prefix = os.path.basename(self.mainfile).rsplit('.', 1)[0]
+                prefix = os.path.basename(self.mainfile).rsplit(".", 1)[0]
                 traj_files = [f for f in traj_files if prefix in f]
         else:
             traj_files = []
             if type(dump[0]) in [str, int]:
                 dump = [dump]
             traj_files = [d[4] for d in dump]
-        traj_files = [i for n, i in enumerate(traj_files) if i not in traj_files[:n]]  # remove duplicates
+        traj_files = [
+            i for n, i in enumerate(traj_files) if i not in traj_files[:n]
+        ]  # remove duplicates
 
         return [os.path.join(self.maindir, f) for f in traj_files]
 
     def get_data_files(self):
-        read_data = self.get('read_data')
-        if read_data is None or 'CPU' in read_data:
-            self.logger.warning('Data file not specified in directory, will scan.')
+        read_data = self.get("read_data")
+        if read_data is None or "CPU" in read_data:
+            self.logger.warning("Data file not specified in directory, will scan.")
             # TODO improve matching of data file
             data_files = os.listdir(self.maindir)
-            data_files = [f for f in data_files if f.endswith('data') or f.startswith('data')]
+            data_files = [
+                f for f in data_files if f.endswith("data") or f.startswith("data")
+            ]
             if len(data_files) > 1:
-                prefix = os.path.basename(self.mainfile).rsplit('.', 1)[1]  # JFR- @Alvin Please check this - changed from [0] to [1] for case that filename is leading with log
+                prefix = os.path.basename(
+                    self.mainfile
+                ).rsplit(
+                    ".", 1
+                )[
+                    1
+                ]  # JFR- @Alvin Please check this - changed from [0] to [1] for case that filename is leading with log
                 data_files = [f for f in data_files if prefix in f]
         else:
             data_files = read_data
@@ -513,17 +803,19 @@ def get_data_files(self):
         return [os.path.join(self.maindir, f) for f in data_files]
 
     def get_pbc(self):
-        pbc = self.get('boundary', ['p', 'p', 'p'])
-        return [v == 'p' for v in pbc]
+        pbc = self.get("boundary", ["p", "p", "p"])
+        return [v == "p" for v in pbc]
 
     def get_sampling_method(self):
-        fix_style = self.get('fix', [[''] * 3])[0][2]
+        fix_style = self.get("fix", [[""] * 3])[0][2]
 
-        sampling_method = 'langevin_dynamics' if 'langevin' in fix_style else 'molecular_dynamics'
+        sampling_method = (
+            "langevin_dynamics" if "langevin" in fix_style else "molecular_dynamics"
+        )
         return sampling_method, fix_style
 
     def get_thermostat_settings(self):
-        fix = self.get('fix', [None])[0]
+        fix = self.get("fix", [None])[0]
         if fix is None:
             return {}
 
@@ -532,50 +824,50 @@ def get_thermostat_settings(self):
         except IndexError:
             return {}
 
-        temp_unit = self.units.get('temperature', 1)
-        press_unit = self.units.get('pressure', 1)
-        time_unit = self.units.get('time', 1)
+        temp_unit = self.units.get("temperature", 1)
+        press_unit = self.units.get("pressure", 1)
+        time_unit = self.units.get("time", 1)
 
         res = dict()
-        if fix_style.lower() == 'nvt':
+        if fix_style.lower() == "nvt":
             try:
-                res['target_T'] = float(fix[5]) * temp_unit
-                res['thermostat_tau'] = float(fix[6]) * time_unit
+                res["target_T"] = float(fix[5]) * temp_unit
+                res["thermostat_tau"] = float(fix[6]) * time_unit
             except Exception:
                 pass
 
-        elif fix_style.lower() == 'npt':
+        elif fix_style.lower() == "npt":
             try:
-                res['target_T'] = float(fix[5]) * temp_unit
-                res['thermostat_tau'] = float(fix[6]) * time_unit
-                res['target_P'] = float(fix[9]) * press_unit
-                res['barostat_tau'] = float(fix[10]) * time_unit
+                res["target_T"] = float(fix[5]) * temp_unit
+                res["thermostat_tau"] = float(fix[6]) * time_unit
+                res["target_P"] = float(fix[9]) * press_unit
+                res["barostat_tau"] = float(fix[10]) * time_unit
             except Exception:
                 pass
 
-        elif fix_style.lower() == 'nph':
+        elif fix_style.lower() == "nph":
             try:
-                res['target_P'] = float(fix[5]) * press_unit
-                res['barostat_tau'] = float(fix[6]) * time_unit
+                res["target_P"] = float(fix[5]) * press_unit
+                res["barostat_tau"] = float(fix[6]) * time_unit
             except Exception:
                 pass
 
-        elif fix_style.lower() == 'langevin':
+        elif fix_style.lower() == "langevin":
             try:
-                res['target_T'] = float(fix[4]) * temp_unit
-                res['langevin_gamma'] = float(fix[5]) * time_unit
+                res["target_T"] = float(fix[4]) * temp_unit
+                res["langevin_gamma"] = float(fix[5]) * time_unit
             except Exception:
                 pass
 
         else:
-            self.logger.warning('Fix style not supported', data=dict(style=fix_style))
+            self.logger.warning("Fix style not supported", data=dict(style=fix_style))
 
         return res
 
     def get_interactions(self):
         styles_coeffs = []
         for interaction in self._interactions:
-            styles = self.get('%s_style' % interaction, None)
+            styles = self.get("%s_style" % interaction, None)
             if styles is None:
                 continue
 
@@ -583,13 +875,13 @@ def get_interactions(self):
                 styles = [styles]
 
             for i in range(len(styles)):
-                if interaction == 'kspace':
+                if interaction == "kspace":
                     coeff = [[float(c) for c in styles[i][1:]]]
                     style = styles[i][0]
 
                 else:
                     coeff = self.get("%s_coeff" % interaction)
-                    style = ' '.join([str(si) for si in styles[i]])
+                    style = " ".join([str(si) for si in styles[i]])
 
                 styles_coeffs.append((style.strip(), coeff))
 
@@ -610,7 +902,9 @@ def eval(self, key, *args, **kwargs):
         for parser in self._parsers:
             parser_method = getattr(parser, key)
             if parser_method is not None:
-                val = parser_method(*args, **kwargs) if args or kwargs else parser_method
+                val = (
+                    parser_method(*args, **kwargs) if args or kwargs else parser_method
+                )
                 if val is not None:
                     return val
 
@@ -621,18 +915,29 @@ def __init__(self):
         self.log_parser = LogParser()
         self._traj_parser = TrajParser()
         self._xyztraj_parser = XYZTrajParser()
-        self._mdanalysistraj_parser = MDAnalysisParser(topology_format='DATA', format='LAMMPSDUMP')
+        self._mdanalysistraj_parser = MDAnalysisParser(
+            topology_format="DATA", format="LAMMPSDUMP"
+        )
         self.data_parser = DataParser()
         self.aux_log_parser = LogParser()
         self._energy_mapping = {
-            'e_pair': 'pair', 'e_bond': 'bond', 'e_angle': 'angle', 'e_dihed': 'dihedral',
-            'e_impro': 'improper', 'e_coul': 'coulomb', 'e_vdwl': 'van der Waals',
-            'e_mol': 'molecular', 'e_long': 'kspace long range',
-            'e_tail': 'van der Waals long range', 'kineng': 'kinetic', 'poteng': 'potential'}
+            "e_pair": "pair",
+            "e_bond": "bond",
+            "e_angle": "angle",
+            "e_dihed": "dihedral",
+            "e_impro": "improper",
+            "e_coul": "coulomb",
+            "e_vdwl": "van der Waals",
+            "e_mol": "molecular",
+            "e_long": "kspace long range",
+            "e_tail": "van der Waals long range",
+            "kineng": "kinetic",
+            "poteng": "potential",
+        }
 
     def get_time_step(self):
-        time_unit = self.log_parser.units.get('time', None)
-        time_step = self.log_parser.get('timestep', [0], unit=time_unit)[0]
+        time_unit = self.log_parser.units.get("time", None)
+        time_step = self.log_parser.get("timestep", [0], unit=time_unit)[0]
         return time_step
 
     def parse_thermodynamic_data(self):
@@ -645,106 +950,158 @@ def parse_thermodynamic_data(self):
             thermo_data = self.aux_log_parser.get_thermodynamic_data()
         if not thermo_data:
             thermo_data = {}
-        self.thermodynamics_steps = [int(n) for n in thermo_data.get('Step', [])]
+        self.thermodynamics_steps = [int(n) for n in thermo_data.get("Step", [])]
 
         if not thermo_data:
             return
 
         for step in self.thermodynamics_steps:
             step_data = {
-                'step': step,
-                'time': step * time_step,
-                'method_ref': sec_run.method[-1] if sec_run.method else None,
-                'energy': {
-                    'contributions': []
-                }
+                "step": step,
+                "time": step * time_step,
+                "method_ref": sec_run.method[-1] if sec_run.method else None,
+                "energy": {"contributions": []},
             }
             if step in self._trajectory_steps:
-                step_data['forces'] = dict(total=dict(
-                    value=self.traj_parsers.eval('get_forces', self._trajectory_steps.index(step)))),
+                step_data["forces"] = (
+                    dict(
+                        total=dict(
+                            value=self.traj_parsers.eval(
+                                "get_forces", self._trajectory_steps.index(step)
+                            )
+                        )
+                    ),
+                )
 
             data_n = self._thermodynamics_steps.index(step)
             for key, val in thermo_data.items():
                 key = key.lower()
                 if (kind := self._energy_mapping.get(key)) is not None:
-                    step_data['energy']['contributions'].append(dict(kind=kind, value=val[data_n]))
-                elif key == 'toteng':
-                    step_data['energy']['current'] = dict(value=val[data_n])
-                    step_data['energy']['total'] = dict(value=val[data_n])
-                elif key == 'press':
-                    step_data['pressure'] = val[data_n]
-                elif key == 'temp':
-                    step_data['temperature'] = val[data_n]
-                elif key == 'cpu':
+                    step_data["energy"]["contributions"].append(
+                        dict(kind=kind, value=val[data_n])
+                    )
+                elif key == "toteng":
+                    step_data["energy"]["current"] = dict(value=val[data_n])
+                    step_data["energy"]["total"] = dict(value=val[data_n])
+                elif key == "press":
+                    step_data["pressure"] = val[data_n]
+                elif key == "temp":
+                    step_data["temperature"] = val[data_n]
+                elif key == "cpu":
                     # approx time calc is dt / dstep
                     max_step = len(self._thermodynamics_steps) - 1
                     # calc time cannot be calculated for last iter, will be zero
-                    delta_time = float(val[min(data_n + 1, max_step)]) - float(val[data_n])
-                    delta_step = 1 if data_n == max_step else self._thermodynamics_steps[data_n + 1] - step
-                    step_data['time_calculation'] = delta_time * ureg.s / delta_step
-                    step_data['time_physical'] = float(val[data_n]) * ureg.s + step_data['time_calculation']
+                    delta_time = float(val[min(data_n + 1, max_step)]) - float(
+                        val[data_n]
+                    )
+                    delta_step = (
+                        1
+                        if data_n == max_step
+                        else self._thermodynamics_steps[data_n + 1] - step
+                    )
+                    step_data["time_calculation"] = delta_time * ureg.s / delta_step
+                    step_data["time_physical"] = (
+                        float(val[data_n]) * ureg.s + step_data["time_calculation"]
+                    )
 
             self.parse_thermodynamics_step(step_data)
 
     def parse_workflow(self):
         sec_run = self.archive.run[-1]
-        sec_calc = sec_run.get('calculation')
+        sec_calc = sec_run.get("calculation")
         sec_lammps = sec_run.x_lammps_section_control_parameters[-1]
 
         units = self.log_parser.units
         if not units:
-            self.logger.warning('Unit information not available. Assuming "real" units in workflow metainfo!')
-            units = get_unit('real')
-        energy_conversion = ureg.convert(1.0, units.get('energy'), ureg.joule)
-        force_conversion = ureg.convert(1.0, units.get('force'), ureg.newton)
-        temperature_conversion = ureg.convert(1.0, units.get('temperature'), ureg.kelvin)
-        pressure_conversion = ureg.convert(1.0, units.get('pressure'), ureg.pascal)
-
-        minimization_stats = self.log_parser.get('minimization_stats', None)
+            self.logger.warning(
+                'Unit information not available. Assuming "real" units in workflow metainfo!'
+            )
+            units = get_unit("real")
+        energy_conversion = ureg.convert(1.0, units.get("energy"), ureg.joule)
+        force_conversion = ureg.convert(1.0, units.get("force"), ureg.newton)
+        temperature_conversion = ureg.convert(
+            1.0, units.get("temperature"), ureg.kelvin
+        )
+        pressure_conversion = ureg.convert(1.0, units.get("pressure"), ureg.pascal)
+
+        minimization_stats = self.log_parser.get("minimization_stats", None)
         workflow = None
         if minimization_stats is not None:
             workflow = GeometryOptimization(
-                method=GeometryOptimizationMethod(), results=GeometryOptimizationResults())
-            workflow.method.type = 'atomic'
-
-            min_style = self.log_parser.get('min_style')
-            min_style = min_style[0].lower() if min_style else 'none'
-            min_style_map = {'cg': 'polak_ribiere_conjugant_gradient',
-                             'hftn': 'hessian_free_truncated_newton', 'sd': 'steepest_descent',
-                             'quickmin': 'damped_dynamics', 'fire': 'damped_dynamics',
-                             'spin': 'damped_dynamics'}
-            value = min_style_map.get(min_style, [val for key, val in min_style_map.items() if key in min_style])
-            value = value if not isinstance(value, list) else value[0] if len(value) != 0 else None
+                method=GeometryOptimizationMethod(),
+                results=GeometryOptimizationResults(),
+            )
+            workflow.method.type = "atomic"
+
+            min_style = self.log_parser.get("min_style")
+            min_style = min_style[0].lower() if min_style else "none"
+            min_style_map = {
+                "cg": "polak_ribiere_conjugant_gradient",
+                "hftn": "hessian_free_truncated_newton",
+                "sd": "steepest_descent",
+                "quickmin": "damped_dynamics",
+                "fire": "damped_dynamics",
+                "spin": "damped_dynamics",
+            }
+            value = min_style_map.get(
+                min_style,
+                [val for key, val in min_style_map.items() if key in min_style],
+            )
+            value = (
+                value
+                if not isinstance(value, list)
+                else value[0]
+                if len(value) != 0
+                else None
+            )
             workflow.method.method = value
 
-            minimization_stats = minimization_stats.split('\n')
-            energy_index = [i for i, s in enumerate(minimization_stats) if 'Energy initial, next-to-last, final' in s]
+            minimization_stats = minimization_stats.split("\n")
+            energy_index = [
+                i
+                for i, s in enumerate(minimization_stats)
+                if "Energy initial, next-to-last, final" in s
+            ]
             if len(energy_index) != 0:
                 energy_stats = minimization_stats[energy_index[0] + 1].split()
-                workflow.results.final_energy_difference = (float(energy_stats[-1]) - float(energy_stats[-2])) * energy_conversion
-
-            force_index = [i for i, s in enumerate(minimization_stats) if 'Force two-norm initial, final = 3167.24 0.509175' in s]
+                workflow.results.final_energy_difference = (
+                    float(energy_stats[-1]) - float(energy_stats[-2])
+                ) * energy_conversion
+
+            force_index = [
+                i
+                for i, s in enumerate(minimization_stats)
+                if "Force two-norm initial, final = 3167.24 0.509175" in s
+            ]
             if len(force_index) != 0:
-                force_stats = minimization_stats[force_index[0]].split('=')[1]
+                force_stats = minimization_stats[force_index[0]].split("=")[1]
                 force_stats = force_stats.split()
-                workflow.results.final_force_maximum = float(force_stats[-1]) * force_conversion
+                workflow.results.final_force_maximum = (
+                    float(force_stats[-1]) * force_conversion
+                )
 
-            minimize_parameters = self.log_parser.get('minimize')
+            minimize_parameters = self.log_parser.get("minimize")
             if not minimize_parameters:
-                minimize_parameters = self.log_parser.get('minimize/kk')
+                minimize_parameters = self.log_parser.get("minimize/kk")
             if minimize_parameters:
-                workflow.method.optimization_steps_maximum = int(minimize_parameters[0][2])
-                workflow.method.convergence_tolerance_force_maximum = minimize_parameters[0][1] * force_conversion
-                workflow.method.convergence_tolerance_energy_difference = minimize_parameters[0][0] * energy_conversion
+                workflow.method.optimization_steps_maximum = int(
+                    minimize_parameters[0][2]
+                )
+                workflow.method.convergence_tolerance_force_maximum = (
+                    minimize_parameters[0][1] * force_conversion
+                )
+                workflow.method.convergence_tolerance_energy_difference = (
+                    minimize_parameters[0][0] * energy_conversion
+                )
 
             energies = []
             steps = []
             for calc in sec_calc:
-                val = calc.get('energy')
-                energy = val.get('total') if val else None
+                val = calc.get("energy")
+                energy = val.get("total") if val else None
                 if energy:
                     energies.append(energy.value.magnitude)
-                    step = calc.get('step')
+                    step = calc.get("step")
                     steps.append(step)
             workflow.results.energies = energies
             workflow.results.steps = steps
@@ -753,34 +1110,46 @@ def parse_workflow(self):
 
         else:
             method, results = {}, {}
-            results['finished_normally'] = self.log_parser.get('finished') is not None
+            results["finished_normally"] = self.log_parser.get("finished") is not None
             dump_params = sec_lammps.x_lammps_inout_control_dump.split()
-            if ',' in dump_params[3]:
-                coordinate_save_frequency = dump_params[3].replace(',', '')
+            if "," in dump_params[3]:
+                coordinate_save_frequency = dump_params[3].replace(",", "")
             else:
                 coordinate_save_frequency = dump_params[3]
-            method['coordinate_save_frequency'] = int(coordinate_save_frequency)
-            method['n_steps'] = (len(sec_run.system) - 1) * method['coordinate_save_frequency']
-            if 'vx' in dump_params[7:] or 'vy' in dump_params[7:] or 'vz' in dump_params[7:]:
-                method['velocity_save_frequency'] = int(dump_params[3])
-            if 'fx' in dump_params[7:] or 'fy' in dump_params[7:] or 'fz' in dump_params[7:]:
-                method['force_save_frequency'] = int(dump_params[3])
+            method["coordinate_save_frequency"] = int(coordinate_save_frequency)
+            method["n_steps"] = (len(sec_run.system) - 1) * method[
+                "coordinate_save_frequency"
+            ]
+            if (
+                "vx" in dump_params[7:]
+                or "vy" in dump_params[7:]
+                or "vz" in dump_params[7:]
+            ):
+                method["velocity_save_frequency"] = int(dump_params[3])
+            if (
+                "fx" in dump_params[7:]
+                or "fy" in dump_params[7:]
+                or "fz" in dump_params[7:]
+            ):
+                method["force_save_frequency"] = int(dump_params[3])
             if sec_lammps.x_lammps_inout_control_thermo is not None:
-                method['thermodynamics_save_frequency'] = int(sec_lammps.x_lammps_inout_control_thermo.split()[0])
+                method["thermodynamics_save_frequency"] = int(
+                    sec_lammps.x_lammps_inout_control_thermo.split()[0]
+                )
             # runstyle has 2 options: Velocity-Verlet (default) or rRESPA Multi-Timescale
             runstyle = sec_lammps.x_lammps_inout_control_runstyle
             if runstyle is not None:
-                if 'respa' in runstyle.lower:
-                    method['integrator_type'] = 'rRESPA_multitimescale'
+                if "respa" in runstyle.lower:
+                    method["integrator_type"] = "rRESPA_multitimescale"
                 else:
-                    method['integrator_type'] = 'velocity_verlet'
+                    method["integrator_type"] = "velocity_verlet"
             else:
-                method['integrator_type'] = 'velocity_verlet'
+                method["integrator_type"] = "velocity_verlet"
             integration_timestep = self.get_time_step()
-            method['integration_timestep'] = integration_timestep
+            method["integration_timestep"] = integration_timestep
 
             thermostat_parameters, barostat_parameters = {}, {}
-            val = self.log_parser.get('fix', None)
+            val = self.log_parser.get("fix", None)
             if val is not None:
                 val_remove_duplicates = val if len(val) == 1 else []
                 val_tmp = val[0]
@@ -798,208 +1167,252 @@ def parse_workflow(self):
                     fix_group = fix[1]
                     fix_style = fix[2]
 
-                    if fix_group != 'all':  # ignore any complex settings
+                    if fix_group != "all":  # ignore any complex settings
                         continue
 
                     reference_temperature = None
                     coupling_constant = None
-                    if 'nvt' in fix_style or 'npt' in fix_style:
-                        thermostat_parameters['thermostat_type'] = 'nose_hoover'
-                        if 'temp' in fix:
-                            i_temp = np.where(fix == 'temp')[0]
+                    if "nvt" in fix_style or "npt" in fix_style:
+                        thermostat_parameters["thermostat_type"] = "nose_hoover"
+                        if "temp" in fix:
+                            i_temp = np.where(fix == "temp")[0]
                             reference_temperature = float(fix[i_temp + 2])  # stop temp
-                            coupling_constant = float(fix[i_temp + 3]) * integration_timestep
-                    elif fix_style == 'temp/berendsen':
-                        thermostat_parameters['thermostat_type'] = 'berendsen'
+                            coupling_constant = (
+                                float(fix[i_temp + 3]) * integration_timestep
+                            )
+                    elif fix_style == "temp/berendsen":
+                        thermostat_parameters["thermostat_type"] = "berendsen"
                         i_temp = 3
                         reference_temperature = float(fix[i_temp + 2])  # stop temp
-                        coupling_constant = float(fix[i_temp + 3]) * integration_timestep
-                    elif fix_style == 'temp/csvr':
-                        thermostat_parameters['thermostat_type'] = 'velocity_rescaling'
+                        coupling_constant = (
+                            float(fix[i_temp + 3]) * integration_timestep
+                        )
+                    elif fix_style == "temp/csvr":
+                        thermostat_parameters["thermostat_type"] = "velocity_rescaling"
                         i_temp = 3
                         reference_temperature = float(fix[i_temp + 2])  # stop temp
-                        coupling_constant = float(fix[i_temp + 3]) * integration_timestep
-                    elif fix_style == 'temp/csld':
-                        thermostat_parameters['thermostat_type'] = 'velocity_rescaling_langevin'
+                        coupling_constant = (
+                            float(fix[i_temp + 3]) * integration_timestep
+                        )
+                    elif fix_style == "temp/csld":
+                        thermostat_parameters[
+                            "thermostat_type"
+                        ] = "velocity_rescaling_langevin"
                         i_temp = 3
                         reference_temperature = float(fix[i_temp + 2])  # stop temp
-                        coupling_constant = float(fix[i_temp + 3]) * integration_timestep
-                    elif fix_style == 'langevin':
-                        thermostat_parameters['thermostat_type'] = 'langevin_schneider'
+                        coupling_constant = (
+                            float(fix[i_temp + 3]) * integration_timestep
+                        )
+                    elif fix_style == "langevin":
+                        thermostat_parameters["thermostat_type"] = "langevin_schneider"
                         i_temp = 3
                         reference_temperature = float(fix[i_temp + 2])  # stop temp
-                        coupling_constant = float(fix[i_temp + 3]) * integration_timestep
-                    elif 'brownian' in fix_style:
-                        thermostat_parameters['thermostat_type'] = 'brownian'
+                        coupling_constant = (
+                            float(fix[i_temp + 3]) * integration_timestep
+                        )
+                    elif "brownian" in fix_style:
+                        thermostat_parameters["thermostat_type"] = "brownian"
                         i_temp = 3
                         reference_temperature = float(fix[i_temp + 2])  # stop temp
                         # coupling_constant =  # ignore multiple coupling parameters
-                    thermostat_parameters['reference_temperature'] = reference_temperature * temperature_conversion
-                    thermostat_parameters['coupling_constant'] = coupling_constant
+                    thermostat_parameters["reference_temperature"] = (
+                        reference_temperature * temperature_conversion
+                    )
+                    thermostat_parameters["coupling_constant"] = coupling_constant
 
                     barostat_type = None
-                    if 'npt' in fix_style or 'nph' in fix_style:
+                    if "npt" in fix_style or "nph" in fix_style:
                         coupling_constant = np.zeros(shape=(3, 3))
                         reference_pressure = np.zeros(shape=(3, 3))
                         compressibility = None
-                        barostat_type = 'nose_hoover'
-                        if 'iso' in fix:
-                            i_baro = np.where(fix == 'iso')[0]
-                            barostat_parameters['coupling_type'] = 'isotropic'
+                        barostat_type = "nose_hoover"
+                        if "iso" in fix:
+                            i_baro = np.where(fix == "iso")[0]
+                            barostat_parameters["coupling_type"] = "isotropic"
                             np.fill_diagonal(coupling_constant, float(fix[i_baro + 3]))
                             np.fill_diagonal(reference_pressure, float(fix[i_baro + 2]))
                         else:
-                            barostat_parameters['coupling_type'] = 'anisotropic'
-                        if 'x' in fix:
-                            i_baro = np.where(fix == 'x')[0]
+                            barostat_parameters["coupling_type"] = "anisotropic"
+                        if "x" in fix:
+                            i_baro = np.where(fix == "x")[0]
                             coupling_constant[0, 0] = float(fix[i_baro + 3])
                             reference_pressure[0, 0] = float(fix[i_baro + 2])
-                        if 'y' in fix:
-                            i_baro = np.where(fix == 'y')[0]
+                        if "y" in fix:
+                            i_baro = np.where(fix == "y")[0]
                             coupling_constant[1, 1] = float(fix[i_baro + 3])
                             reference_pressure[1, 1] = float(fix[i_baro + 2])
-                        if 'z' in fix:
-                            i_baro = np.where(fix == 'z')[0]
+                        if "z" in fix:
+                            i_baro = np.where(fix == "z")[0]
                             coupling_constant[2, 2] = float(fix[i_baro + 3])
                             reference_pressure[2, 2] = float(fix[i_baro + 2])
-                        if 'xy' in fix:
-                            i_baro = np.where(fix == 'xy')[0]
+                        if "xy" in fix:
+                            i_baro = np.where(fix == "xy")[0]
                             coupling_constant[0, 1] = float(fix[i_baro + 3])
                             coupling_constant[1, 0] = float(fix[i_baro + 3])
                             reference_pressure[0, 1] = float(fix[i_baro + 2])
                             reference_pressure[1, 0] = float(fix[i_baro + 2])
-                        if 'yz' in fix:
-                            i_baro = np.where(fix == 'yz')[0]
+                        if "yz" in fix:
+                            i_baro = np.where(fix == "yz")[0]
                             coupling_constant[1, 2] = float(fix[i_baro + 3])
                             coupling_constant[2, 1] = float(fix[i_baro + 3])
                             reference_pressure[1, 2] = float(fix[i_baro + 2])
                             reference_pressure[2, 1] = float(fix[i_baro + 2])
-                        if 'xz' in fix:
-                            i_baro = np.where(fix == 'xz')[0]
+                        if "xz" in fix:
+                            i_baro = np.where(fix == "xz")[0]
                             coupling_constant[0, 3] = float(fix[i_baro + 3])
                             coupling_constant[3, 0] = float(fix[i_baro + 3])
                             reference_pressure[0, 3] = float(fix[i_baro + 2])
                             reference_pressure[3, 0] = float(fix[i_baro + 2])
-                        barostat_parameters['reference_pressure'] = reference_pressure * pressure_conversion  # stop pressure
-                        barostat_parameters['coupling_constant'] = coupling_constant * integration_timestep
-                        barostat_parameters['compressibility'] = compressibility
-
-                    if fix_style == 'press/berendsen':
-                        barostat_type = 'berendsen'
-                        if 'iso' in fix:
-                            i_baro = np.where(fix == 'iso')[0]
-                            barostat_parameters['coupling_type'] = 'isotropic'
+                        barostat_parameters["reference_pressure"] = (
+                            reference_pressure * pressure_conversion
+                        )  # stop pressure
+                        barostat_parameters["coupling_constant"] = (
+                            coupling_constant * integration_timestep
+                        )
+                        barostat_parameters["compressibility"] = compressibility
+
+                    if fix_style == "press/berendsen":
+                        barostat_type = "berendsen"
+                        if "iso" in fix:
+                            i_baro = np.where(fix == "iso")[0]
+                            barostat_parameters["coupling_type"] = "isotropic"
                             np.fill_diagonal(coupling_constant, float(fix[i_baro + 3]))
-                        elif 'aniso' in fix:
-                            i_baro = np.where(fix == 'aniso')[0]
-                            barostat_parameters['coupling_type'] = 'anisotropic'
-                            coupling_constant[:3] += 1.
+                        elif "aniso" in fix:
+                            i_baro = np.where(fix == "aniso")[0]
+                            barostat_parameters["coupling_type"] = "anisotropic"
+                            coupling_constant[:3] += 1.0
                             coupling_constant[:3] *= float(fix[i_baro + 3])
                         else:
-                            barostat_parameters['coupling_type'] = 'anisotropic'
-                        if 'x' in fix:
-                            i_baro = np.where(fix == 'x')[0]
+                            barostat_parameters["coupling_type"] = "anisotropic"
+                        if "x" in fix:
+                            i_baro = np.where(fix == "x")[0]
                             coupling_constant[0] = float(fix[i_baro + 3])
-                        if 'y' in fix:
-                            i_baro = np.where(fix == 'y')[0]
+                        if "y" in fix:
+                            i_baro = np.where(fix == "y")[0]
                             coupling_constant[1] = float(fix[i_baro + 3])
-                        if 'z' in fix:
-                            i_baro = np.where(fix == 'z')[0]
+                        if "z" in fix:
+                            i_baro = np.where(fix == "z")[0]
                             coupling_constant[2] = float(fix[i_baro + 3])
-                        if 'couple' in fix:
-                            i_baro = np.where(fix == 'couple')[0]
+                        if "couple" in fix:
+                            i_baro = np.where(fix == "couple")[0]
                             couple = fix[i_baro]
-                            if couple == 'xyz':
-                                barostat_parameters['coupling_type'] = 'isotropic'
-                            elif couple == 'xy' or couple == 'yz' or couple == 'xz':
-                                barostat_parameters['coupling_type'] = 'anisotropic'
-                        barostat_parameters['reference_pressure'] = float(fix[i_baro + 2]) * pressure_conversion  # stop pressure
-                        barostat_parameters['coupling_constant'] = np.ones(shape=(3, 3)) * float(fix[i_baro + 3]) * integration_timestep
-                    barostat_parameters['barostat_type'] = barostat_type
+                            if couple == "xyz":
+                                barostat_parameters["coupling_type"] = "isotropic"
+                            elif couple == "xy" or couple == "yz" or couple == "xz":
+                                barostat_parameters["coupling_type"] = "anisotropic"
+                        barostat_parameters["reference_pressure"] = (
+                            float(fix[i_baro + 2]) * pressure_conversion
+                        )  # stop pressure
+                        barostat_parameters["coupling_constant"] = (
+                            np.ones(shape=(3, 3))
+                            * float(fix[i_baro + 3])
+                            * integration_timestep
+                        )
+                    barostat_parameters["barostat_type"] = barostat_type
 
             if thermostat_parameters:
-                method['thermodynamic_ensemble'] = 'NPT' if barostat_type == 'nose_hoover' else 'NVT'
-            elif barostat_type == 'nose_hoover':
-                method['thermodynamic_ensemble'] = 'NPH'
+                method["thermodynamic_ensemble"] = (
+                    "NPT" if barostat_type == "nose_hoover" else "NVT"
+                )
+            elif barostat_type == "nose_hoover":
+                method["thermodynamic_ensemble"] = "NPH"
             else:
-                method['thermodynamic_ensemble'] = 'NVE'
+                method["thermodynamic_ensemble"] = "NVE"
 
-            method['thermostat_parameters'] = thermostat_parameters
-            method['barostat_parameters'] = barostat_parameters
+            method["thermostat_parameters"] = thermostat_parameters
+            method["barostat_parameters"] = barostat_parameters
 
             self.parse_md_workflow(dict(method=method, results=results))
 
     def parse_system(self):
         sec_run = self.archive.run[-1]
 
-        n_traj = self.traj_parsers.eval('n_frames')
+        n_traj = self.traj_parsers.eval("n_frames")
         if n_traj is None:
             return
 
-        self.n_atoms = [self.traj_parsers.eval('get_n_atoms', n) for n in range(n_traj)]
-        self.trajectory_steps = [step for n in range(n_traj) if (step := self.traj_parsers.eval('get_step', n)) is not None]
+        self.n_atoms = [self.traj_parsers.eval("get_n_atoms", n) for n in range(n_traj)]
+        self.trajectory_steps = [
+            step
+            for n in range(n_traj)
+            if (step := self.traj_parsers.eval("get_step", n)) is not None
+        ]
 
         units = self.log_parser.units
 
         def apply_unit(value, unit):
-            if not hasattr(value, 'units'):
+            if not hasattr(value, "units"):
                 value = value * units.get(unit, 1)
             return value
 
         def get_composition(children_names):
             children_count_tup = np.unique(children_names, return_counts=True)
-            formula = ''.join([f'{name}({count})' for name, count in zip(*children_count_tup)])
+            formula = "".join(
+                [f"{name}({count})" for name, count in zip(*children_count_tup)]
+            )
             return formula
 
         for step in self.trajectory_steps:
             traj_n = self._trajectory_steps.index(step)
-            lattice_vectors = self.traj_parsers.eval('get_lattice_vectors', traj_n)
+            lattice_vectors = self.traj_parsers.eval("get_lattice_vectors", traj_n)
             if lattice_vectors is not None:
-                lattice_vectors = apply_unit(lattice_vectors, 'distance')
-            velocities = self.traj_parsers.eval('get_velocities', traj_n)
+                lattice_vectors = apply_unit(lattice_vectors, "distance")
+            velocities = self.traj_parsers.eval("get_velocities", traj_n)
             if velocities is not None:
-                velocities = apply_unit(velocities, 'velocity')
+                velocities = apply_unit(velocities, "velocity")
             bond_list = []
             if traj_n == 0:  # TODO add references to the bond list for other steps
-                bond_list = get_bond_list_from_model_contributions(sec_run, method_index=-1, model_index=-1)
-            self.parse_trajectory_step({
-                'atoms': {
-                    'n_atoms': self.traj_parsers.eval('get_n_atoms', traj_n),
-                    'lattice_vectors': lattice_vectors,
-                    'periodic': self.traj_parsers.eval('get_pbc', traj_n),
-                    'positions': apply_unit(self.traj_parsers.eval('get_positions', traj_n), 'distance'),
-                    'labels': self.traj_parsers.eval('get_atom_labels', traj_n),
-                    'velocities': velocities,
-                    'bond_list': bond_list
+                bond_list = get_bond_list_from_model_contributions(
+                    sec_run, method_index=-1, model_index=-1
+                )
+            self.parse_trajectory_step(
+                {
+                    "atoms": {
+                        "n_atoms": self.traj_parsers.eval("get_n_atoms", traj_n),
+                        "lattice_vectors": lattice_vectors,
+                        "periodic": self.traj_parsers.eval("get_pbc", traj_n),
+                        "positions": apply_unit(
+                            self.traj_parsers.eval("get_positions", traj_n), "distance"
+                        ),
+                        "labels": self.traj_parsers.eval("get_atom_labels", traj_n),
+                        "velocities": velocities,
+                        "bond_list": bond_list,
+                    }
                 }
-            })
+            )
 
         if not sec_run.system:
             return
 
         sec_system = sec_run.system[-1]
         # parse atomsgroup (moltypes --> molecules --> residues)
-        atoms_info = self._mdanalysistraj_parser.get('atoms_info', None)
+        atoms_info = self._mdanalysistraj_parser.get("atoms_info", None)
         if atoms_info is None:
-            atoms_info = self.traj_parsers.eval('atoms_info')
+            atoms_info = self.traj_parsers.eval("atoms_info")
             if isinstance(atoms_info, list):
-                atoms_info = atoms_info[0] if atoms_info else None  # using info from the initial frame
+                atoms_info = (
+                    atoms_info[0] if atoms_info else None
+                )  # using info from the initial frame
         if atoms_info is not None:
-            atoms_moltypes = np.array(atoms_info.get('moltypes', []))
-            atoms_molnums = np.array(atoms_info.get('molnums', []))
-            atoms_resids = np.array(atoms_info.get('resids', []))
-            atoms_elements = np.array(atoms_info.get('elements', ['X'] * self.n_atoms))
-            atoms_types = np.array(atoms_info.get('types', []))
-            atom_labels = sec_system.atoms.get('labels')
-            if 'X' in atoms_elements:
-                atoms_elements = np.array(atom_labels) if atom_labels and 'X' not in atom_labels else atoms_types
-            atoms_resnames = np.array(atoms_info.get('resnames', []))
+            atoms_moltypes = np.array(atoms_info.get("moltypes", []))
+            atoms_molnums = np.array(atoms_info.get("molnums", []))
+            atoms_resids = np.array(atoms_info.get("resids", []))
+            atoms_elements = np.array(atoms_info.get("elements", ["X"] * self.n_atoms))
+            atoms_types = np.array(atoms_info.get("types", []))
+            atom_labels = sec_system.atoms.get("labels")
+            if "X" in atoms_elements:
+                atoms_elements = (
+                    np.array(atom_labels)
+                    if atom_labels and "X" not in atom_labels
+                    else atoms_types
+                )
+            atoms_resnames = np.array(atoms_info.get("resnames", []))
             moltypes = np.unique(atoms_moltypes)
             for i_moltype, moltype in enumerate(moltypes):
                 # Only add atomsgroup for initial system for now
                 sec_molecule_group = sec_run.system[0].m_create(AtomsGroup)
-                sec_molecule_group.label = f'group_{moltype}'
-                sec_molecule_group.type = 'molecule_group'
+                sec_molecule_group.label = f"group_{moltype}"
+                sec_molecule_group.type = "molecule_group"
                 sec_molecule_group.index = i_moltype
                 sec_molecule_group.atom_indices = np.where(atoms_moltypes == moltype)[0]
                 sec_molecule_group.n_atoms = len(sec_molecule_group.atom_indices)
@@ -1007,18 +1420,22 @@ def get_composition(children_names):
                 # mol_nums is the molecule identifier for each atom
                 mol_nums = atoms_molnums[sec_molecule_group.atom_indices]
                 moltype_count = np.unique(mol_nums).shape[0]
-                sec_molecule_group.composition_formula = f'{moltype}({moltype_count})'
+                sec_molecule_group.composition_formula = f"{moltype}({moltype_count})"
 
                 molecules = atoms_molnums
-                for i_molecule, molecule in enumerate(np.unique(molecules[sec_molecule_group.atom_indices])):
+                for i_molecule, molecule in enumerate(
+                    np.unique(molecules[sec_molecule_group.atom_indices])
+                ):
                     sec_molecule = sec_molecule_group.m_create(AtomsGroup)
                     sec_molecule.index = i_molecule
                     sec_molecule.atom_indices = np.where(molecules == molecule)[0]
                     sec_molecule.n_atoms = len(sec_molecule.atom_indices)
                     # use first particle to get the moltype
                     # not sure why but this value is being cast to int, cast back to str
-                    sec_molecule.label = str(atoms_moltypes[sec_molecule.atom_indices[0]])
-                    sec_molecule.type = 'molecule'
+                    sec_molecule.label = str(
+                        atoms_moltypes[sec_molecule.atom_indices[0]]
+                    )
+                    sec_molecule.type = "molecule"
                     sec_molecule.is_molecule = True
 
                     mol_resids = np.unique(atoms_resids[sec_molecule.atom_indices])
@@ -1032,27 +1449,39 @@ def get_composition(children_names):
                         for i_restype, restype in enumerate(restypes):
                             sec_monomer_group = sec_molecule.m_create(AtomsGroup)
                             restype_indices = np.where(atoms_resnames == restype)[0]
-                            sec_monomer_group.label = f'group_{restype}'
-                            sec_monomer_group.type = 'monomer_group'
+                            sec_monomer_group.label = f"group_{restype}"
+                            sec_monomer_group.type = "monomer_group"
                             sec_monomer_group.index = i_restype
-                            sec_monomer_group.atom_indices = np.intersect1d(restype_indices, sec_molecule.atom_indices)
-                            sec_monomer_group.n_atoms = len(sec_monomer_group.atom_indices)
+                            sec_monomer_group.atom_indices = np.intersect1d(
+                                restype_indices, sec_molecule.atom_indices
+                            )
+                            sec_monomer_group.n_atoms = len(
+                                sec_monomer_group.atom_indices
+                            )
                             sec_monomer_group.is_molecule = False
 
-                            restype_resids = np.unique(atoms_resids[sec_monomer_group.atom_indices])
+                            restype_resids = np.unique(
+                                atoms_resids[sec_monomer_group.atom_indices]
+                            )
                             restype_count = restype_resids.shape[0]
-                            sec_monomer_group.composition_formula = f'{restype}({restype_count})'
+                            sec_monomer_group.composition_formula = (
+                                f"{restype}({restype_count})"
+                            )
                             for i_res, res_id in enumerate(restype_resids):
                                 sec_residue = sec_monomer_group.m_create(AtomsGroup)
                                 sec_residue.index = i_res
                                 atom_indices = np.where(atoms_resids == res_id)[0]
-                                sec_residue.atom_indices = np.intersect1d(atom_indices, sec_monomer_group.atom_indices)
+                                sec_residue.atom_indices = np.intersect1d(
+                                    atom_indices, sec_monomer_group.atom_indices
+                                )
                                 sec_residue.n_atoms = len(sec_residue.atom_indices)
                                 sec_residue.label = str(restype)
-                                sec_residue.type = 'monomer'
+                                sec_residue.type = "monomer"
                                 sec_residue.is_molecule = False
                                 elements = atoms_elements[sec_residue.atom_indices]
-                                sec_residue.composition_formula = get_composition(elements)
+                                sec_residue.composition_formula = get_composition(
+                                    elements
+                                )
 
                         names = atoms_resnames[sec_molecule.atom_indices]
                         ids = atoms_resids[sec_molecule.atom_indices]
@@ -1063,7 +1492,9 @@ def get_composition(children_names):
                         # add the 0th index manually
                         ids_firstatom = np.insert(ids_firstatom, 0, 0)
                         names_firstatom = names[ids_firstatom]
-                        sec_molecule.composition_formula = get_composition(names_firstatom)
+                        sec_molecule.composition_formula = get_composition(
+                            names_firstatom
+                        )
 
     def parse_method(self):
         sec_run = self.archive.run[-1]
@@ -1071,7 +1502,7 @@ def parse_method(self):
         if self.traj_parsers[0].mainfile is None or self.data_parser.mainfile is None:
             return
 
-        if self.traj_parsers.eval('n_frames') is None:
+        if self.traj_parsers.eval("n_frames") is None:
             return
 
         sec_method = sec_run.m_create(Method)
@@ -1079,20 +1510,20 @@ def parse_method(self):
         sec_model = sec_force_field.m_create(Model)
 
         # Old parsing of method with text parser
-        masses = self.data_parser.get('Masses', None)
+        masses = self.data_parser.get("Masses", None)
         self.traj_parsers[0].masses = masses
         # @Landinesa: we should be able to set the atom masses with the TrajParser, but I don't quite understand how to use this.
         # Can you add the implementation here, and then we can make the MDA implementation below as a backup?
         # Can you also get the charges somehow?
 
         # parse method with MDAnalysis (should be a backup for the charges and masses...but the interactions are most easily read from the MDA universe right now)
-        n_atoms = self.traj_parsers.eval('get_n_atoms', 0)
+        n_atoms = self.traj_parsers.eval("get_n_atoms", 0)
         if n_atoms is not None:
-            atoms_info = self._mdanalysistraj_parser.get('atoms_info', None)
+            atoms_info = self._mdanalysistraj_parser.get("atoms_info", None)
             for n in range(n_atoms):
                 sec_atom = sec_method.m_create(AtomParameters)
-                sec_atom.charge = atoms_info.get('charges', [None] * (n + 1))[n]
-                sec_atom.mass = atoms_info.get('masses', [None] * (n + 1))[n]
+                sec_atom.charge = atoms_info.get("charges", [None] * (n + 1))[n]
+                sec_atom.mass = atoms_info.get("masses", [None] * (n + 1))[n]
 
         # TODO address case types are numbered instead of giving atom labels (fix tests accordingly)
         interactions = self._mdanalysistraj_parser.get_interactions()
@@ -1100,42 +1531,52 @@ def parse_method(self):
 
         # Force Calculation Parameters
         sec_force_calculations = sec_force_field.m_create(ForceCalculations)
-        for pairstyle in self.log_parser.get('pair_style', []):
+        for pairstyle in self.log_parser.get("pair_style", []):
             pairstyle_args = pairstyle[1:]
             pairstyle = pairstyle[0].lower()
-            if 'lj' in pairstyle and 'coul' not in pairstyle:  # only cover the simplest case
-                sec_force_calculations.vdw_cutoff = float(pairstyle_args[-1]) * ureg.nanometer
-            if 'coul' in pairstyle:
-                if 'streitz' in pairstyle:
+            if (
+                "lj" in pairstyle and "coul" not in pairstyle
+            ):  # only cover the simplest case
+                sec_force_calculations.vdw_cutoff = (
+                    float(pairstyle_args[-1]) * ureg.nanometer
+                )
+            if "coul" in pairstyle:
+                if "streitz" in pairstyle:
                     cutoff = float(pairstyle_args[0])
                 else:
                     cutoff = float(pairstyle_args[-1])
                 sec_force_calculations.coulomb_cutoff = cutoff * ureg.nanometer
-            val = self.log_parser.get('kspace_style', None)
+            val = self.log_parser.get("kspace_style", None)
             if val is not None:
                 kspacestyle = val[0][0].lower()
-                if 'ewald' in kspacestyle:
-                    sec_force_calculations.coulomb_type = 'ewald'
-                elif 'pppm' in kspacestyle:
-                    sec_force_calculations.coulomb_type = 'particle_particle_particle_mesh'
-                elif 'msm' in kspacestyle:
-                    sec_force_calculations.coulomb_type = 'multilevel_summation'
+                if "ewald" in kspacestyle:
+                    sec_force_calculations.coulomb_type = "ewald"
+                elif "pppm" in kspacestyle:
+                    sec_force_calculations.coulomb_type = (
+                        "particle_particle_particle_mesh"
+                    )
+                elif "msm" in kspacestyle:
+                    sec_force_calculations.coulomb_type = "multilevel_summation"
 
         sec_neighbor_searching = sec_force_calculations.m_create(NeighborSearching)
-        val = self.log_parser.get('neighbor', None)
+        val = self.log_parser.get("neighbor", None)
         if val is not None:
             neighbor = val[0][0]  # just use the first instance for now
             vdw_cutoff = sec_force_calculations.vdw_cutoff
             if vdw_cutoff is not None:
-                sec_neighbor_searching.neighbor_update_cutoff = float(neighbor) * ureg.nanometer
+                sec_neighbor_searching.neighbor_update_cutoff = (
+                    float(neighbor) * ureg.nanometer
+                )
                 sec_neighbor_searching.neighbor_update_cutoff += vdw_cutoff
-        val = self.log_parser.get('neigh_modify', None)
+        val = self.log_parser.get("neigh_modify", None)
         if val is not None:
             neighmodify = val[0]  # just use the first instace for now
             neighmodify = np.array([str(i).lower() for i in neighmodify])
-            if 'every' in neighmodify:
-                index = np.where(neighmodify == 'every')[0]
-                sec_neighbor_searching.neighbor_update_frequency = int(neighmodify[index + 1])
+            if "every" in neighmodify:
+                index = np.where(neighmodify == "every")[0]
+                sec_neighbor_searching.neighbor_update_frequency = int(
+                    neighmodify[index + 1]
+                )
 
     def parse_input(self):
         sec_run = self.archive.run[-1]
@@ -1143,11 +1584,13 @@ def parse_input(self):
 
         if self.data_parser.mainfile is not None:
             sec_input_output_files.x_lammps_inout_file_data = os.path.basename(
-                self.data_parser.mainfile)
+                self.data_parser.mainfile
+            )
 
         if self.traj_parsers[0].mainfile is not None:
             sec_input_output_files.x_lammps_inout_file_trajectory = os.path.basename(
-                self.traj_parsers[0].mainfile)
+                self.traj_parsers[0].mainfile
+            )
 
         sec_control_parameters = sec_run.m_create(x_lammps_section_control_parameters)
         keys = self.log_parser._commands
@@ -1156,10 +1599,13 @@ def parse_input(self):
             if val is None:
                 continue
             val = val[0] if len(val) == 1 else val
-            key = 'x_lammps_inout_control_%s' % key.replace('_', '').replace('/', '').lower()
+            key = (
+                "x_lammps_inout_control_%s"
+                % key.replace("_", "").replace("/", "").lower()
+            )
             if hasattr(sec_control_parameters, key):
                 if isinstance(val, list):
-                    val = ' '.join([str(v) for v in val])
+                    val = " ".join([str(v) for v in val])
                 setattr(sec_control_parameters, key, str(val))
 
     def init_parser(self):
@@ -1185,48 +1631,63 @@ def parse(self, filepath, archive, logger):
 
         # parse basic
         sec_run.program = Program(
-            name='LAMMPS', version=self.log_parser.get('program_version', ''))
+            name="LAMMPS", version=self.log_parser.get("program_version", "")
+        )
 
         # parse data file associated with calculation
         data_files = self.log_parser.get_data_files()
         if len(data_files) > 1:
-            self.logger.warning('Multiple data files are specified')
+            self.logger.warning("Multiple data files are specified")
         if data_files:
             self.data_parser.mainfile = data_files[0]
 
         # parse trajectorty file associated with calculation
         traj_files = self.log_parser.get_traj_files()
         if len(traj_files) > 1:
-            self.logger.warning('Multiple traj files are specified')
+            self.logger.warning("Multiple traj files are specified")
 
         parsers = []
         for n, traj_file in enumerate(traj_files):
             # parser initialization for each traj file cannot be avoided as there are
             # cases where traj files can share the same parser
-            file_type = self.log_parser.get('dump', [[1, 'all', traj_file[-3:]]] * (n + 1))[n][2]
-            if file_type == 'dcd' and data_files:
-                traj_parser = MDAnalysisParser(topology_format='DATA', format='DCD')
+            file_type = self.log_parser.get(
+                "dump", [[1, "all", traj_file[-3:]]] * (n + 1)
+            )[n][2]
+            if file_type == "dcd" and data_files:
+                traj_parser = MDAnalysisParser(topology_format="DATA", format="DCD")
                 traj_parser.mainfile = data_files[0]
                 traj_parser.auxilliary_files = [traj_file]
                 self._mdanalysistraj_parser = traj_parser
-            elif file_type == 'xyz' and data_files:
-                traj_parser = MDAnalysisParser(topology_format='DATA', format='XYZ')
+            elif file_type == "xyz" and data_files:
+                traj_parser = MDAnalysisParser(topology_format="DATA", format="XYZ")
                 traj_parser.mainfile = data_files[0]
                 traj_parser.auxilliary_files = [traj_file]
                 self._mdanalysistraj_parser = traj_parser
-            elif file_type == 'custom' and data_files:
-                custom_options = self.log_parser.get('dump')[n][5:]
-                custom_options = [option.replace('xu', 'x') for option in custom_options]
-                custom_options = [option.replace('yu', 'y') for option in custom_options]
-                custom_options = [option.replace('zu', 'z') for option in custom_options]
-                custom_options = ' '.join(custom_options)
-                traj_parser = MDAnalysisParser(topology_format='DATA', format='LAMMPSDUMP', atom_style=custom_options)
+            elif file_type == "custom" and data_files:
+                custom_options = self.log_parser.get("dump")[n][5:]
+                custom_options = [
+                    option.replace("xu", "x") for option in custom_options
+                ]
+                custom_options = [
+                    option.replace("yu", "y") for option in custom_options
+                ]
+                custom_options = [
+                    option.replace("zu", "z") for option in custom_options
+                ]
+                custom_options = " ".join(custom_options)
+                traj_parser = MDAnalysisParser(
+                    topology_format="DATA",
+                    format="LAMMPSDUMP",
+                    atom_style=custom_options,
+                )
                 if data_files:
                     traj_parser.mainfile = data_files[0]
                 traj_parser.auxilliary_files = [traj_file]
                 # try to check if MDAnalysis can construct the universe or at least parse
                 # the atoms, otherwise will fall back to TrajParser
-                if traj_parser.universe is None or 'X' in traj_parser.get('atoms_info', {}).get('names', []):
+                if traj_parser.universe is None or "X" in traj_parser.get(
+                    "atoms_info", {}
+                ).get("names", []):
                     # mda necessary to calculate rdf and atomsgroup
                     if n == 0:
                         self._mdanalysistraj_parser = traj_parser
@@ -1243,9 +1704,10 @@ def parse(self, filepath, archive, logger):
             return
 
         # parse data from auxiliary log file
-        if self.log_parser.get('log') is not None:
+        if self.log_parser.get("log") is not None:
             self.aux_log_parser.mainfile = os.path.join(
-                self.log_parser.maindir, self.log_parser.get('log')[0])
+                self.log_parser.maindir, self.log_parser.get("log")[0]
+            )
             # we assign units here which is read from log parser
             self.aux_log_parser._units = self.log_parser.units