% Delayo et al., SPAA 2022: conference paper on automatic management of High-Bandwidth Memory (HBM).
% Acronyms in title/series/booktitle are brace-protected so sentence-casing styles keep them upper-case.
@inproceedings{0b92049908cd405998862c6fde709b99,
title = "Automatic {HBM} Management: Models and Algorithms",
abstract = "Some past and future supercomputer nodes incorporate High-Bandwidth Memory (HBM). Compared to standard DRAM, HBM has similar latency, higher bandwidth and lower capacity. In this paper, we evaluate algorithms for managing High-Bandwidth Memory automatically. Previous work suggests that, in the worst case, performance is extremely sensitive to the policy for managing the channel to DRAM. Prior theory shows that a priority-based scheme (where there is a static strict priority-order among p threads for channel access) is O(1)-competitive, but FIFO is not, and in the worst case is $\Omega(p)$ competitive. Following this theoretical guidance would be a disruptive change for vendors, who currently use FIFO variants in their DRAM controller hardware. Our goal is to determine theoretically and empirically whether we can justify recommending investment in priority-based DRAM controller hardware. In order to experiment with DRAM channel protocols, we chose a theoretical model, validated it against real hardware, and implemented a basic simulator. We corroborated the previous theoretical results for the model, conducted a parameter sweep while running our simulator on address traces from memory bandwidth-bound codes (GNU sort and TACO sparse matrix-vector product), and designed better channel-access algorithms.",
keywords = "dynamic priority, fairness, far-channel arbitration, fcfs, fifo, first-come-first-serve, first-in-first-out, hbm, high-bandwidth memory, knight's landing, knl, lru, makespan, memory hierarchy, memory management, priority queue, queue management, sapphire rapids, scheduling, timeliness, xeon phi",
author = "Delayo, Daniel and Zhang, Kenny and Agrawal, Kunal and Bender, Michael A. and Berry, Jonathan W. and Das, Rathish and Moseley, Benjamin and Phillips, Cynthia A.",
note = "Publisher Copyright: {\textcopyright} 2022 ACM.; 34th ACM Symposium on Parallelism in Algorithms and Architectures, SPAA 2022; Conference date: 11-07-2022 Through 14-07-2022",
year = "2022",
month = jul,
day = "11",
doi = "10.1145/3490148.3538570",
language = "English",
series = "Annual {ACM} Symposium on Parallelism in Algorithms and Architectures",
publisher = "Association for Computing Machinery",
pages = "147--159",
booktitle = "{SPAA} 2022 - Proceedings of the 34th {ACM} Symposium on Parallelism in Algorithms and Architectures",
}