% Conference paper: GPU-aware MPI Allreduce built on direct Sendrecv communication.
% The url field points to the publication listing this record was taken from,
% not to the paper itself. The venue field (conference city) is a biblatex field
% and is ignored by classic BibTeX styles.
@inproceedings{chen2025allreduce,
  author    = {Chen, C. and Yao, J. and Subramoni, H. and Panda, D.},
  title     = {Design and Optimization of {GPU}-Aware {MPI} {Allreduce} Using Direct {Sendrecv} Communication},
  booktitle = {54th International Conference on Parallel Processing},
  year      = {2025},
  month     = sep,
  venue     = {San Diego, California},
  url       = {http://nowlab.cse.ohio-state.edu/publications/},
}