@inproceedings{shan2020lcfi,
  author       = {Shan, Baodi and Shamji, Aabid and Tian, Jiannan and Li, Guanpeng and Tao, Dingwen},
  title        = {{LCFI}: A Fault Injection Tool for Studying Lossy Compression Error Propagation in {HPC} Programs},
  booktitle    = {2020 {IEEE} International Conference on Big Data (Big Data)},
  pages        = {2708--2715},
  year         = {2020},
  organization = {IEEE},
}
LLVM/OpenMP
Towards Efficient Remote OpenMP Offloading
Lu, Wenbin, Shan, Baodi, Raut, Eric, Meng, Jie, Araya-Polo, Mauricio, Doerfert, Johannes, Malik, Abid M., and Chapman, Barbara
In OpenMP in a Modern World: From Multi-device Support to Meta Programming 2022
On modern heterogeneous HPC systems, the most popular way to realize distributed computation is the hybrid programming model of MPI+X (X being OpenMP/CUDA/etc.), as it has been proven to perform well with various scientific applications. However, application developers prefer to use a single coherent programming model over a hybrid model, as maintainability and portability decrease per additional model. Recent work [14] has shown that the OpenMP device offloading model could be used to program distributed accelerator-based HPC systems with minimal changes to the application.
@inproceedings{10.1007/978-3-031-15922-0_2,
  author    = {Lu, Wenbin and Shan, Baodi and Raut, Eric and Meng, Jie and Araya-Polo, Mauricio and Doerfert, Johannes and Malik, Abid M. and Chapman, Barbara},
  editor    = {Klemm, Michael and de Supinski, Bronis R. and Klinkenberg, Jannis and Neth, Brandon},
  title     = {Towards Efficient Remote {OpenMP} Offloading},
  booktitle = {{OpenMP} in a Modern World: From Multi-device Support to Meta Programming},
  year      = {2022},
  publisher = {Springer International Publishing},
  address   = {Cham},
  pages     = {17--31},
  isbn      = {978-3-031-15922-0},
}
LLVM/OpenMP
MPI-Based Remote OpenMP Offloading: A More Efficient and Easy-to-Use Implementation
Shan, Baodi, Araya-Polo, Mauricio, Malik, Abid M., and Chapman, Barbara
In Proceedings of the 14th International Workshop on Programming Models and Applications for Multicores and Manycores 2023
@inproceedings{10.1145/3582514.3582519,
  author    = {Shan, Baodi and Araya-Polo, Mauricio and Malik, Abid M. and Chapman, Barbara},
  title     = {{MPI}-Based Remote {OpenMP} Offloading: A More Efficient and Easy-to-Use Implementation},
  booktitle = {Proceedings of the 14th International Workshop on Programming Models and Applications for Multicores and Manycores},
  series    = {PMAM'23},
  location  = {Montreal, QC, Canada},
  pages     = {50--59},
  numpages  = {10},
  year      = {2023},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  isbn      = {9798400701153},
  doi       = {10.1145/3582514.3582519},
  url       = {https://doi.org/10.1145/3582514.3582519},
  keywords  = {OpenMP, distributed computing, GPGPU},
}
Institute for Advanced Computational Science Building, Stony Brook, NY 11790, USA