# Source code for pyretis.testing.simulation_comparison

# Copyright (c) 2026, PyRETIS Development Team.
# Distributed under the LGPLv2.1+ License. See LICENSE for more info.
"""Methods for comparing simulation results.

This module defines methods that can be used for comparing results
from different simulations, such as output files, reports, and
path ensembles.
"""
import math
import os
import filecmp
import numpy as np
from pyretis.testing.helpers import search_for_files
from pyretis.inout.formats.energy import EnergyPathFile
from pyretis.inout.formats.order import OrderPathFile
from pyretis.inout.formats.path import PathExtFile
from pyretis.inout.formats.cross import CrossFile


# Names of the expected output files in archive directories. Only files
# whose basename is in this set are compared by ``compare_traj_archive``:
ARCHIVE_FILES = {'energy.txt', 'order.txt', 'traj.txt'}
# Names of other expected output files:
OUTPUT_FILES = {'energy.txt', 'order.txt', 'pathensemble.txt'}
# Define readers for loading data. The keys are the ``file_type`` strings
# accepted by ``compare_data_by_columns``; the values are the reader
# classes that are instantiated as ``reader(filename, 'r')``:
READERS = {
    'energy': EnergyPathFile,
    'order': OrderPathFile,
    'traj': PathExtFile,
}


def read_files(*files, read_comments=True):
    """Load the lines of each given file into memory.

    The files are assumed to be small enough to be held in memory
    in their entirety.

    Parameters
    ----------
    files : tuple of str
        Paths to the files to read.
    read_comments : bool, optional
        If False, lines whose first non-blank character is "#" are
        dropped.

    Returns
    -------
    all_data : list of list of str
        One list of lines (line endings kept) per input file, in the
        order the files were given.
    """
    contents = []
    for path in files:
        with open(path, 'r', encoding="utf8") as handle:
            if read_comments:
                lines = list(handle)
            else:
                lines = [
                    row for row in handle
                    if not row.strip().startswith('#')
                ]
        contents.append(lines)
    return contents


def compare_text_line_by_line(file1, file2, skip=None, skip_keys=None):
    """Check two text files for equality, one line at a time.

    Trailing newline characters are ignored when two lines are compared.

    Parameters
    ----------
    file1 : str
        The path to the first file to compare.
    file2 : str
        The path to the second file to compare.
    skip : list of int, optional
        0-indexed line numbers that are not compared. When ``skip_keys``
        is also given, the indices refer to the lines that remain after
        the ``skip_keys`` filtering.
    skip_keys : list of str, optional
        Lines whose first whitespace-separated token is in this list are
        removed from both files before the comparison. Useful for
        ignoring settings like ``exe_path`` that differ by run directory.

    Returns
    -------
    equal : bool
        True if the files are deemed to be equal.
    msg : str
        A descriptive message of the result of the comparison.
    """
    lines1, lines2 = read_files(file1, file2, read_comments=True)

    if skip_keys:
        def first_token(text):
            """Return the first token of a line ('' for blank lines)."""
            parts = text.split()
            return parts[0] if parts else ''

        lines1 = [txt for txt in lines1 if first_token(txt) not in skip_keys]
        lines2 = [txt for txt in lines2 if first_token(txt) not in skip_keys]

    if len(lines1) != len(lines2):
        return False, 'The number of lines in the files differ'

    for idx, (left, right) in enumerate(zip(lines1, lines2)):
        if skip and idx in skip:
            continue
        if left.rstrip('\n') != right.rstrip('\n'):
            return False, (f'Line {idx} differs: '
                           f'{left.strip()} != {right.strip()}')
    return True, 'Files are equal'


[docs]def _compare_block_comments(comment1, comment2):
    """Compare two block comment lists, tolerating 1-ULP float differences.

    Parameters
    ----------
    comment1 : list of str
        Comment lines from the first file block.
    comment2 : list of str
        Comment lines from the second file block.

    Returns
    -------
    bool
        True if the comments are considered equal.
    """
    if len(comment1) != len(comment2):
        return False
    for c1, c2 in zip(comment1, comment2):
        if c1 == c2:
            continue
        t1, t2 = c1.split(), c2.split()
        if len(t1) != len(t2):
            return False
        for tok1, tok2 in zip(t1, t2):
            if tok1 == tok2:
                continue
            stripped1 = tok1.strip("(),';")
            stripped2 = tok2.strip("(),';")
            try:
                if not math.isclose(float(stripped1), float(stripped2),
                                    rel_tol=1e-9):
                    return False
            except ValueError:
                return False
    return True


def compare_data_by_columns(file1, file2, file_type, skip=None):
    """Compare two PyRETIS output files block by block and term by term.

    The files are loaded with the reader registered for ``file_type``
    in ``READERS``. For every pair of blocks the comments, the set of
    data labels and the numerical values of each label are compared.

    Parameters
    ----------
    file1 : str
        The path to the first file to compare.
    file2 : str
        The path to the second file to compare.
    file_type : str
        Key into ``READERS`` selecting the reader (e.g., 'energy').
    skip : list of str, optional
        Labels of block data that are not compared. This can, for
        instance, be certain energy terms that are not absolute and
        can't easily be compared.

    Returns
    -------
    equal : bool
        True if the files are deemed to be equal.
    msg : str
        A descriptive message of the result of the comparison.
    """
    def term_mismatch(label, first, second):
        """Return a message if the two arrays differ, otherwise None."""
        if first.shape != second.shape:
            return f'Block term "{label}" shape differs'
        if first.size == 0:
            return f'Block term "{label}" is empty'
        missing = np.isnan(first)
        # NaN must sit at the same positions in both arrays, and a term
        # consisting only of NaN tests nothing. NaN at matching
        # positions alongside finite values is accepted.
        if not np.array_equal(missing, np.isnan(second)):
            return f'NaN positions differ in block term "{label}"'
        if missing.all():
            return f'Block term "{label}" is entirely NaN'
        if not np.allclose(first, second, equal_nan=True):
            return 'Block terms differ'
        return None

    loader = READERS[file_type]
    # Load everything up front so that missing blocks are detected:
    # ``zip`` alone would stop at the shorter sequence and a run that
    # wrote no (or too few) blocks would be reported as equal.
    blocks1 = list(loader(file1, 'r').load())
    blocks2 = list(loader(file2, 'r').load())
    if not (blocks1 and blocks2):
        return False, 'No data blocks to compare'
    if len(blocks1) != len(blocks2):
        return False, (f'Different number of blocks: '
                       f'{len(blocks1)} != {len(blocks2)}')

    for left, right in zip(blocks1, blocks2):
        comments_differ = (
            left['comment'] != right['comment']
            and not _compare_block_comments(left['comment'],
                                            right['comment'])
        )
        if comments_differ:
            return False, 'Block comment differs'
        if sorted(left['data'].keys()) != sorted(right['data'].keys()):
            return False, 'Different items in block data'
        for label, values in left['data'].items():
            if skip and label in skip:
                continue
            problem = term_mismatch(
                label, np.asarray(values), np.asarray(right['data'][label])
            )
            if problem is not None:
                return False, problem
    return True, 'Files are equal'


def compare_numerical_data(file1, file2, rel_tol=1e-5, skip_cols=None):
    """Compare two files containing numerical data.

    Here, we compare files that contain numerical data. We don't
    care about comments here, we just compare the actual numerical data.

    A meaningful comparison must not pass on degenerate input. This
    rejects empty data, shape mismatches, NaNs that sit at *different*
    positions in the two files (a divergence that turned a finite value
    into NaN or vice versa), and data/columns that are *entirely* NaN
    (which test nothing). Partial NaN at *matching* positions -- e.g.
    loaded (``ld``) frames that legitimately have no computed energy --
    is allowed; the finite values around them are still compared.
    Columns that are unavailable for an engine (e.g. a potential energy
    that engine never reports) must be excluded explicitly via
    ``skip_cols`` so the gap is visible rather than silently "equal".

    Parameters
    ----------
    file1 : str
        The path to the first file to compare.
    file2 : str
        The path to the second file to compare.
    rel_tol : float, optional
        Relative tolerance for the comparison.
    skip_cols : list of int, optional
        Column indices to exclude from the comparison (e.g. a column an
        engine does not populate). Excluding a column is explicit and
        visible, unlike letting NaN==NaN pass. The indices are honoured
        for files with a single data row as well.

    Returns
    -------
    equal : bool
        True if the files are deemed to be equal.
    msg : str
        A descriptive message of the result of the comparison.
    """
    # Load as 2D (rows, columns) so that the column axis is still known
    # for files with a single row; by default ``np.loadtxt`` squeezes
    # such files to 1D, which made it impossible to apply ``skip_cols``.
    grid1 = np.loadtxt(file1, ndmin=2)
    grid2 = np.loadtxt(file2, ndmin=2)
    if grid1.size == 0 or grid2.size == 0:
        return False, 'Numerical data is empty'
    # The squeezed arrays are what a plain ``np.loadtxt`` call returns;
    # all checks below operate on these.
    data1 = np.squeeze(grid1)
    data2 = np.squeeze(grid2)
    if data1.shape != data2.shape:
        return False, f'Shapes differ: {data1.shape} != {data2.shape}'
    if skip_cols:
        # A single row and a single column squeeze to the same 1D shape,
        # but column indices only make sense if the layouts agree.
        if grid1.shape != grid2.shape:
            return False, f'Shapes differ: {grid1.shape} != {grid2.shape}'
        keep = [c for c in range(grid1.shape[1]) if c not in skip_cols]
        grid1 = grid1[:, keep]
        grid2 = grid2[:, keep]
        if grid1.size == 0:
            return False, 'All columns were skipped'
        if data1.ndim >= 2:
            data1, data2 = grid1, grid2
        else:
            # Single row/column: return to the squeezed representation.
            data1, data2 = np.squeeze(grid1), np.squeeze(grid2)
    nan1 = np.isnan(data1)
    if not np.array_equal(nan1, np.isnan(data2)):
        return False, 'NaN positions differ'
    if data1.ndim >= 2:
        allnan = nan1.all(axis=0)
        if allnan.any():
            cols = np.where(allnan)[0].tolist()
            return False, f'Column(s) {cols} are entirely NaN'
    elif nan1.all():
        return False, 'All data is NaN'
    if not np.allclose(data1, data2, rtol=rel_tol, equal_nan=True):
        return False, 'Numerical data differ'
    return True, 'Files are equal'


def compare_energy_data(file1, file2, rel_tol=1e-5):
    """Compare two ``energy.txt`` files, tolerating unavailable terms.

    Energy files always carry a fixed set of columns (time, potential,
    kinetic, total, temperature), but not every engine or path populates
    all of them: paths loaded from disk carry no computed energy, and an
    engine may not report e.g. the total energy or the temperature. Such
    a term is written as an entirely-NaN column.

    The actual comparison is delegated to :func:`compare_numerical_data`;
    this function only works out which columns to exclude:

      - Columns that are entirely NaN in *both* files hold nothing to
        compare and are passed on as ``skip_cols``
        (``compare_numerical_data`` rejects all-NaN input instead of
        letting NaN==NaN pass).
      - All other columns are compared as usual. A column that is
        all-NaN in just *one* of the files is not excluded, so it is
        still caught by the NaN-position check.

    Parameters
    ----------
    file1 : str
        The path to the first file to compare.
    file2 : str
        The path to the second file to compare.
    rel_tol : float, optional
        Relative tolerance forwarded to :func:`compare_numerical_data`.

    Returns
    -------
    equal : bool
        True if the files are deemed to be equal.
    msg : str
        A descriptive message of the result of the comparison.
    """
    table1 = np.loadtxt(file1)
    table2 = np.loadtxt(file2)
    if not (table1.size and table2.size):
        return False, 'Numerical data is empty'
    # A 1D result is treated as one row so that ``axis=0`` below
    # reduces over rows and yields one flag per column.
    if table1.ndim == 1:
        table1 = table1[np.newaxis, :]
    if table2.ndim == 1:
        table2 = table2[np.newaxis, :]
    if table1.shape != table2.shape:
        return False, f'Shapes differ: {table1.shape} != {table2.shape}'
    unused1 = np.isnan(table1).all(axis=0)
    unused2 = np.isnan(table2).all(axis=0)
    skip_cols = np.nonzero(unused1 & unused2)[0].tolist()
    if not skip_cols:
        skip_cols = None
    return compare_numerical_data(file1, file2, rel_tol=rel_tol,
                                  skip_cols=skip_cols)


def compare_numerical_mse(file1, file2, tol=1e-12):
    """Compare two numerical files using mean squared error.

    Degenerate input must not pass: a NaN anywhere in the data would
    turn the MSE into NaN, and ``nan > tol`` is False, so the files
    would be reported as equal no matter how much they differ. We
    therefore reject empty data, NaNs at different positions and
    all-NaN data, and compute the MSE over the non-NaN entries only.

    Parameters
    ----------
    file1 : str
        The path to the first file to compare.
    file2 : str
        The path to the second file to compare.
    tol : float, optional
        Tolerance for the mean squared error.

    Returns
    -------
    equal : bool
        True if the MSE is below the tolerance.
    msg : str
        A descriptive message with the MSE value.
    """
    data1 = np.loadtxt(file1)
    data2 = np.loadtxt(file2)
    if data1.shape != data2.shape:
        return False, f'Shapes differ: {data1.shape} != {data2.shape}'
    if data1.size == 0:
        return False, 'Numerical data is empty'
    nan1 = np.isnan(data1)
    if not np.array_equal(nan1, np.isnan(data2)):
        return False, 'NaN positions differ'
    if nan1.all():
        return False, 'All data is NaN'
    if nan1.any():
        # Only the entries that hold a number in both files contribute.
        valid = ~nan1
        data1 = data1[valid]
        data2 = data2[valid]
    mse = np.mean((data1 - data2)**2)
    if np.isnan(mse):
        # E.g. inf - inf; a NaN would slip through the ``>`` test below.
        return False, 'MSE is undefined (NaN)'
    if mse > tol:
        return False, f'MSE {mse} > {tol}'
    return True, f'MSE {mse} is within tolerance'


[docs]def _read_file_lines(filepath):
    """Read all lines from a file."""
    with open(filepath, 'r', encoding='utf-8') as fhandle:
        return fhandle.readlines()


def compare_restarted_text_files(file11, file12, file2):
    """Check that a restarted run reproduces the continuous output.

    The expected pattern is ``file2 == file11 + file12``, where the
    leading header lines (starting with '#') of ``file12`` and its
    first data line are left out. That first data line must repeat the
    last line of ``file11``.

    Parameters
    ----------
    file11 : str
        Path to the first part of the restarted simulation output.
    file12 : str
        Path to the second part of the restarted simulation output.
    file2 : str
        Path to the full (continuous) simulation output.

    Returns
    -------
    equal : bool
        True if the files match the pattern.
    msg : str
        A descriptive message of the result.
    """
    part1 = _read_file_lines(file11)
    part2 = _read_file_lines(file12)
    full = _read_file_lines(file2)

    # Locate the first line of part 2 that is not a header line.
    first_data = next(
        (pos for pos, text in enumerate(part2) if not text.startswith('#')),
        None,
    )
    if first_data is None:
        return False, 'Part 2 of restarted file contains no data'

    # The restart repeats the final line of part 1 as its first data line.
    last_of_part1 = part1[-1] if part1 else None
    if last_of_part1 != part2[first_data]:
        return False, 'Overlapping lines differ between part 1 and part 2'

    # Glue the parts together, dropping the header and the repeated line.
    merged = part1 + part2[first_data + 1:]
    if len(merged) != len(full):
        return (False,
                f'Line count mismatch: {len(merged)} != {len(full)}')

    for pos, (got, expected) in enumerate(zip(merged, full)):
        if got != expected:
            return False, f'Mismatch at line {pos}'
    return True, 'Restarted files match the full simulation'


def compare_simulation_files(file1, file2, skip=None, mode='line'):
    """Compare two simulation output files using the selected method.

    Parameters
    ----------
    file1 : str
        The path to the first file to compare.
    file2 : str
        The path to the second file to compare.
    skip : list of str or list of int, optional
        Items to skip in the comparison. This is only forwarded to the
        line-by-line comparison (``mode='line'``).
    mode : str, optional
        Selects how the comparison is done:
        'numerical' compares the numerical content of the files;
        'line' does a line-by-line text comparison;
        anything else does a literal (byte-wise) file comparison.

    Returns
    -------
    equal : bool
        True if the files were found to be equal, False otherwise.
    msg : str
        A string with information about the comparison result.
    """
    if mode == 'numerical':
        result = compare_numerical_data(file1, file2)
    elif mode == 'line':
        result = compare_text_line_by_line(file1, file2, skip=skip)
    else:
        identical = filecmp.cmp(file1, file2, shallow=False)
        if identical:
            result = (identical, 'Files are equal')
        else:
            result = (identical, 'Files are not equal')
    return result


def compare_traj_archive(dir1, dir2):
    """Compare archived trajectories between two directories.

    The files found by ``search_for_files`` in the two directories are
    sorted and paired up. Paired files must have the same basename, and
    those whose basename is listed in ``ARCHIVE_FILES`` must have
    identical contents.

    Parameters
    ----------
    dir1 : str
        The path to the first directory to use in the comparison.
    dir2 : str
        The path to the second directory to use in the comparison.

    Returns
    -------
    errors : list of tuple
        The pairs of files that differed, if any. If the directories
        hold a different number of files, the only entry is
        ``(dir1, dir2)``.
    """
    found1 = sorted(search_for_files(dir1))
    found2 = sorted(search_for_files(dir2))
    # Pairing the files is meaningless if the counts do not agree:
    if len(found1) != len(found2):
        return [(dir1, dir2)]
    mismatches = []
    for path1, path2 in zip(found1, found2):
        name = os.path.basename(path1)
        if name != os.path.basename(path2):
            mismatches.append((path1, path2))
            continue
        # Only the files written by PyRETIS are compared:
        if name not in ARCHIVE_FILES:
            continue
        same, _ = compare_simulation_files(path1, path2, mode='cmp')
        if not same:
            mismatches.append((path1, path2))
    return mismatches


def compare_path_ensemble_data(file1, file2, rel_tol=1e-5, skip=None):
    """Compare two path ensemble files.

    We compare line-by-line, but skip comments and we check that
    numbers are close, as judged by the given relative tolerance.

    A row that is too short, or that holds a value which cannot be
    converted to the expected type (e.g. output truncated by a crashed
    run), is reported as a difference rather than raising an exception.

    Parameters
    ----------
    file1 : str
        The path to the first file to consider in the comparison.
    file2 : str
        The path to the second file to consider in the comparison.
    rel_tol : float, optional
        A relative tolerance used to determine if numbers are equal.
    skip : list of int, optional
        These are columns we are to skip in the comparison.

    Returns
    -------
    equal : bool
        True if the files are equal, False otherwise.
    msg : str
        A message describing the result of the comparison.
    """
    rows1, rows2 = read_files(file1, file2, read_comments=False)
    if len(rows1) != len(rows2):
        return False, 'The number of lines in the files differ'
    # Two empty (comments-only) path-ensemble files would otherwise
    # pass the length check (0 == 0) and the per-row loop would never
    # run -- a simulation that recorded no MC moves must not be reported
    # as "equal" to a reference.
    if not rows1:
        return False, 'Path ensemble file has no data rows'
    # Define the expected data types for the columns in the path
    # ensemble files:
    data_types = {
        0: int, 1: int, 2: int, 3: str, 4: str, 5: str, 6: int, 7: str, 8: str,
        9: float, 10: float, 11: int, 12: int, 13: float, 14: int, 15: int,
    }
    for i, (line1, line2) in enumerate(zip(rows1, rows2)):
        stuff1 = line1.split()
        stuff2 = line2.split()
        for col, func in data_types.items():
            if skip and col in skip:
                continue
            try:
                val1 = func(stuff1[col])
                val2 = func(stuff2[col])
            except (IndexError, ValueError):
                # Missing column or a value of the wrong type.
                return False, f'Malformed data on line {i}, column {col}'
            if func is str:
                check = val1 == val2
            else:
                check = math.isclose(val1, val2, rel_tol=rel_tol)
            if not check:
                return False, f'Files differ on line {i}, column {col}'

    return True, 'Files are equal'


def compare_reports_normalized(fil1, fil2):
    """Compare two reports after removing environment-dependent lines.

    Before the line-by-line comparison, ``<style>`` blocks, ``<meta>``
    tags, the XML declaration, time stamp lines and the
    ``html4css1.css`` id line are removed, and ``color: gray`` is
    rewritten to ``color: grey``. This keeps the comparison robust
    against differences in, e.g., the Docutils version.

    Parameters
    ----------
    fil1 : str
        The path to the first report to compare.
    fil2 : str
        The path to the second report to compare.

    Returns
    -------
    equal : bool
        True if reports are essentially equal.
    msg : str
        Description of mismatch if found.
    """
    def essential_lines(filepath):
        """Return the lines of a report that carry actual content."""
        kept = []
        inside_style = False
        with open(filepath, 'r', encoding='utf-8') as infile:
            for raw in infile:
                text = raw.strip()
                # Everything up to and including the closing tag of a
                # <style> block is dropped (docutils CSS).
                if inside_style:
                    inside_style = '</style>' not in raw
                    continue
                if text.startswith('<style'):
                    inside_style = '</style>' not in raw
                    continue
                # The XML declaration and meta tags depend on the
                # docutils version.
                if text.startswith(('<?xml ', '<meta ')):
                    continue
                # Time stamps:
                is_timestamp = (text.startswith('on ')
                                and text.endswith(('.', '.</p>')))
                if 'generated by PyRETIS' in raw or is_timestamp:
                    continue
                # Id line of the style sheet, which might shift:
                if ':Id: $Id: html4css1.css' in raw:
                    continue
                # Use a single spelling for gray/grey in CSS:
                kept.append(raw.replace('color: gray', 'color: grey'))
        return kept

    lines1 = essential_lines(fil1)
    lines2 = essential_lines(fil2)

    if len(lines1) != len(lines2):
        return False, 'Reports differ in number of contentful lines'

    for idx, (left, right) in enumerate(zip(lines1, lines2)):
        if left != right:
            return False, f'Mismatch at cleaned line {idx}: {left.strip()}'

    return True, 'Reports are essentially equal'


def compare_restarted_cross_files(file11, file12, file2):
    """Compare CrossFile data from a restarted simulation.

    The data of all blocks in each file is concatenated. The two parts
    of the restarted run are then joined -- leaving out the first row
    of the second part when it repeats the last row of the first part --
    and the result is compared to the data of the continuous run.

    Parameters
    ----------
    file11 : str
        Path to the first part of the crossing data.
    file12 : str
        Path to the second part of the crossing data.
    file2 : str
        Path to the full (continuous) crossing data.

    Returns
    -------
    equal : bool
        True if the crossing data matches.
    msg : str
        A descriptive message.
    """
    def load_flattened(fpath):
        """Return the data rows of all blocks in a file as one array."""
        loaded = list(CrossFile(fpath, 'r').load())
        return np.array([row for block in loaded for row in block['data']])

    full = load_flattened(file2)
    head = load_flattened(file11)
    tail = load_flattened(file12)

    if head.size == 0:
        merged = tail
    elif tail.size == 0:
        merged = head
    else:
        # Drop the first row of the second part if it duplicates the
        # last row of the first part.
        overlap = np.array_equal(head[-1], tail[0])
        merged = np.vstack((head, tail[1:] if overlap else tail))

    if merged.shape != full.shape:
        return False, (f'Data shape mismatch: {merged.shape} != '
                       f'{full.shape}')

    if not np.array_equal(merged, full):
        return False, 'Crossing data mismatch'

    return True, 'Crossing data matches'