% Conference paper entry.
% - Given names are stored as initials because the full names are not recorded here.
% - venue holds the conference city (not a publisher address).
% - source is a non-standard field that styles ignore; presumably the listing
%   page this record was taken from (confirm before promoting it to url).
@inproceedings{chen2026casting,
  author    = {Chen, C. and Contini, N. and Xu, L. and Queiser, J. and Subramoni, H. and Panda, D.},
  title     = {Design and Implementation of Casting Compression for {GPU}-Aware {MPI} Collectives},
  booktitle = {40th {IEEE} International Parallel \& Distributed Processing Symposium},
  year      = {2026},
  month     = may,
  venue     = {New Orleans, USA},
  source    = {http://nowlab.cse.ohio-state.edu/publications/},
}