Skip to content

Commit fc250c2

Browse files
authored
TL: updated arxiv link
1 parent c490446 commit fc250c2

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

_bibliography/pint.bib

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -8141,9 +8141,9 @@ @article{PeterssonEtAl2025b
8141 8141
@unpublished{RoseEtAl2025,
8142 8142
abstract = {In the quest for highest performance in scientific computing, we present a novel framework that relies on high-bandwidth communication between GPUs in a compute cluster. The framework offers linear scaling of performance for explicit algorithms that is only limited by the size of the dataset and the number of GPUs. Slices of the dataset propagate in a ring of processes (GPUs) from one GPU, where they are processed, to the next, which results in a parallel-in-time parallelization. The user of the framework has to write GPU kernels that implement the algorithm and provide slices of the dataset. Knowledge about the underlying parallelization strategy is not required because the communication between processes is carried out by the framework. As a case study, molecular dynamics simulation based on the Lennard-Jones potential is implemented to measure the performance for a homogeneous fluid. Single node performance and strong scaling behavior of this framework is compared to LAMMPS, which is outperformed in the strong scaling case.},
8143 8143
author = {Martin Rose and Simon Homes and Lukas Ramsperger and Jose Gracia and Christoph Niethammer and Jadran Vrabec},
8144-
howpublished = {arXiv:2507.11289v1 [cs.DC]},
8144+
howpublished = {arXiv:2507.11289 [cs.DC]},
8145 8145
title = {Cyclic Data Streaming on GPUs for Short Range Stencils Applied to Molecular Dynamics},
8146-
url = {http://arxiv.org/abs/2507.11289v1},
8146+
url = {http://arxiv.org/abs/2507.11289},
8147 8147
year = {2025},
8148 8148
}
8149 8149

0 commit comments

Comments
 (0)