% Journal article introducing the mdxplain Python API (Journal of Molecular Biology, 2026).
% Conventions used in this entry:
%   - doi holds the bare identifier; the bibliography style adds the resolver prefix.
%   - {mdxplain} is braced in the title so style recasing keeps the lowercase software name.
%   - Authors use the "Last, First" form; accents are written as braced LaTeX escapes so the
%     entry sorts and renders correctly under classic BibTeX as well as Biber.
%   - pages appears to hold the article number (it matches the DOI suffix) -- confirm
%     against the publisher record once volume/issue are assigned.
@article{SALOMON2026169809,
  author   = {Salomon, Maximilian and Pankonin, Maik and Butler, Maeve Branwen and Batebi, Hossein and Stadler, Peter F. and Hildebrand, Peter W. and P{\'e}rez-Hern{\'a}ndez, Guillermo},
  title    = {{mdxplain}: Scalable Molecular Dynamics Analysis with Machine Learning-Based Feature Selection and Modular Workflows},
  journal  = {Journal of Molecular Biology},
  year     = {2026},
  pages    = {169809},
  issn     = {0022-2836},
  doi      = {10.1016/j.jmb.2026.169809},
  url      = {https://www.sciencedirect.com/science/article/pii/S0022283626001828},
  keywords = {Molecular Dynamics, Machine Learning, Explainability, FAIR Principles, Computational Biophysics},
  abstract = {Molecular dynamics (MD) simulations provide detailed, time-resolved insight into molecular motion. Advances in hardware and software now make very large systems accessible, increasing the need for efficient tools to analyze the resulting trajectories. We introduce mdxplain, a high-level Python API that facilitates the creation of scalable, streamlined, and reusable analysis pipelines for large MD datasets with only a few lines of code. A unified object exposes all functionality, combining typical MD featurization and MD metrics with dimensionality reduction, clustering and feature selection via decision trees, supporting expert and non-expert users in identifying structural patterns and explain the dynamic behavior of their systems. Leveraging metadata annotations for trajectory- and residue-selection, mdxplain can handle multiple topologies in a single execution and uses optimized memory handling to process large datasets (millions of frames) efficiently. Its reports include distributional and time-series plots, representative conformations and decision trees combined with optional 3D visualization via PyMOL and NGLView. Pipelines can be exported at all time, bundling all relevant data for reuse, ensuring reproducibility and FAIR compliance. The Python API, together with documentation, examples, and tutorials is available on github.com/maximilian-salomon/mdxplain and on mdxplain.de.},
}