@comment{
  FOURST conference paper, ISPASS 2022.
  The citation key is kept unchanged so existing citations continue to resolve.
  Event name, event dates and the copyright line live in eventtitle, eventdate
  and copyright; standard BibTeX styles ignore these fields, so they no longer
  print as a free-text note in the rendered reference.
}
@inproceedings{657b12eac1e24dc387468831694929bd,
  author     = {Ahmad, Zafar and Javanmard, Mohammad Mahdi and Croisdale, Gregory and Gregory, Aaron and Ganapathi, Pramod and Pouchet, Louis Noel and Chowdhury, Rezaul},
  title      = {{FOURST}: A code generator for {FFT}-based fast stencil computations},
  booktitle  = {Proceedings - 2022 {IEEE} International Symposium on Performance Analysis of Systems and Software, {ISPASS} 2022},
  eventtitle = {2022 {IEEE} International Symposium on Performance Analysis of Systems and Software, {ISPASS} 2022},
  eventdate  = {2022-05-22/2022-05-24},
  publisher  = {Institute of Electrical and Electronics Engineers Inc.},
  year       = {2022},
  pages      = {99--108},
  doi        = {10.1109/ISPASS55109.2022.00010},
  language   = {English},
  copyright  = {{\textcopyright} 2022 IEEE},
  keywords   = {FFT, FOURST, Fast Stencil Computation, Fast-Fourier Transform, Grid Simulation, Simulation, Stencil, Stencil Computations},
  abstract   = {Stencil computations are ubiquitous in modern grid-based physical simulations. In this paper, we present FOURST - a compiler to generate programs computing time iterated linear periodic and aperiodic stencil computations with fast Fourier transform methods. This paper outlines the design and implementation of the code generation approach in FOURST, to automatically generate FFT-based stencil solvers. We present experimental results on the state-of-the-art Ookami supercomputer housing Fujitsu A64FX and Intel Skylake processors, to study the performance of FOURST and a state-of-the-art tiling-based optimized code generator PLuTo on various stencil shapes and varying the number of time iterations. We discuss the performance profiles, and limitations, of both approaches on high-end modern hardware.},
}