# Source code for irradiapy.io.lammpslogreader

"""Class to read LAMMPS log files."""

import re
from collections import defaultdict
from dataclasses import dataclass, field
from pathlib import Path
from typing import Any, Generator

import numpy as np
from numpy import typing as npt



# [docs]
@dataclass
class LAMMPSLogReader:
    """Class to read LAMMPS log files.

    Parameters
    ----------
    log_path : Path
        The path to the LAMMPS log file.

    Yields
    -------
    Generator[dict[str, Any], None, None]
        A dictionary containing the thermo data.

    Note
    ----
    This generator yields a dictionary with a single key for the thermo data,
    this ensures compatibility if this reader is extended to read more data in the future.
    """

    log_path: Path
    data: dict = field(default_factory=lambda: {"thermo": None}, init=False)
    thermo: npt.NDArray[np.float64] = field(
        default_factory=lambda: np.empty(0, dtype=np.dtype([])), init=False
    )

    def __iter__(self) -> Generator[dict[str, Any], None, None]:
        """Reads a LAMMPS log file.

        Yields
        ------
        dict[str, Any]
            Snapshot data containing the thermo array.
        """
        self.__reset()
        expecting_header = False  # Next line will be a header
        expecting_data = False  # Next lines will be data
        for line in open(self.log_path, "r", encoding="utf-8"):
            if line.startswith("Per MPI "):
                expecting_header = True
                self.__reset()
                continue
            elif line.startswith("Loop time") or line.startswith("Fix halt"):
                if self.thermo.size > 0:
                    self.__fill()
                    yield self.data
                expecting_header = False
                expecting_data = False
                self.__reset()
                continue
            if expecting_header:
                items = line.split()
                types = [np.float64] * len(items)
                if "Step" in items:
                    types[items.index("Step")] = np.int64
                dtype = np.dtype(list(zip(items, types)))
                self.thermo = np.empty(0, dtype=dtype)
                expecting_header = False
                expecting_data = True
                continue
            if expecting_data:
                if line.startswith("WARNING"):
                    continue
                row = np.array(tuple(map(float, line.split())), dtype=dtype)
                self.thermo = np.append(self.thermo, row)

    def __reset(self) -> None:
        """Reset the internal state of the reader."""
        self.thermo = np.empty(0, dtype=np.dtype([]))
        self.data = {"thermo": self.thermo}

    def __fill(self) -> None:
        """Fill the data dictionary with data."""
        self.data["thermo"] = self.thermo


[docs]
    def get_pka_data(self) -> defaultdict:
        """Extract PKA data if exists."""

        data = defaultdict(None)

        # Patterns to capture numbers and tuples
        float_pat = re.compile(r"[-+]?(?:\d+(?:\.\d*)?|\.\d+)(?:[eE][-+]?\d+)?")
        tuple_pat = re.compile(r"\(([^)]*)\)")

        def first_float(s: str) -> float | None:
            m = float_pat.search(s)
            return float(m.group()) if m else None

        with open(self.path_log, "r", encoding="utf-8") as file:
            for raw in file:
                line = raw.lstrip()  # normalize leading spaces
                if line.startswith("ID:"):
                    data["id"] = int(line.split(":", 1)[1].strip())
                elif line.startswith("Element:"):
                    data["element"] = int(line.split(":", 1)[1].strip())
                elif line.startswith("Position:"):
                    m = tuple_pat.search(line)
                    if m:
                        data["pos"] = np.array(
                            [float(x) for x in float_pat.findall(m.group(1))]
                        )
                elif line.startswith("Energy:"):
                    data["energy"] = first_float(line)
                elif line.startswith("Speed:"):
                    data["speed"] = first_float(line)
                elif line.startswith("Velocity:"):
                    m = tuple_pat.search(line)
                    if m:
                        data["vel"] = np.array(
                            [float(x) for x in float_pat.findall(m.group(1))]
                        )
                elif line.startswith("Polar angle (theta):"):
                    data["polar"] = first_float(line)
                elif line.startswith("Azimuthal angle (phi):"):
                    data["azimuthal"] = first_float(line)

        return data