@article{DBLP:journals/ijhpca/GuoRZBSAISCLOGZOABJSFDC25,
  author       = {Yanfei Guo and
                  Ken Raffenetti and
                  Hui Zhou and
                  Pavan Balaji and
                  Min Si and
                  Abdelhalim Amer and
                  Shintaro Iwasaki and
                  Sangmin Seo and
                  Giuseppe Congiu and
                  Robert Latham and
                  Lena Oden and
                  Thomas Gillis and
                  Rohit Zambre and
                  Kaiming Ouyang and
                  Charles Archer and
                  Wesley Bland and
                  Jithin Jose and
                  Sayantan Sur and
                  Hajime Fujita and
                  Dmitry Durnov and
                  Michael Chuvelev and
                  Gengbin Zheng and
                  Alex Brooks and
                  Sagar Thapaliya and
                  Taru Doodi and
                  Maria Garzaran and
                  Steve Oyanagi and
                  Marc Snir and
                  Rajeev Thakur},
  title        = {Preparing {MPICH} for exascale},
  journal      = {Int. J. High Perform. Comput. Appl.},
  volume       = {39},
  number       = {2},
  pages        = {283--305},
  year         = {2025},
  url          = {https://doi.org/10.1177/10943420241311608},
  doi          = {10.1177/10943420241311608},
  timestamp    = {Tue, 15 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijhpca/GuoRZBSAISCLOGZOABJSFDC25.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ics/HuangD0ZLHRZ0LC24,
  author       = {Jiajun Huang and
                  Sheng Di and
                  Xiaodong Yu and
                  Yujia Zhai and
                  Jinyang Liu and
                  Yafan Huang and
                  Ken Raffenetti and
                  Hui Zhou and
                  Kai Zhao and
                  Xiaoyi Lu and
                  Zizhong Chen and
                  Franck Cappello and
                  Yanfei Guo and
                  Rajeev Thakur},
  editor       = {Kenji Kise and
                  Valentina Salapura and
                  Murali Annavaram and
                  Ana Lucia Varbanescu},
  title        = {{gZCCL:} Compression-Accelerated Collective Communication Framework
                  for {GPU} Clusters},
  booktitle    = {Proceedings of the 38th {ACM} International Conference on Supercomputing,
                  {ICS} 2024, Kyoto, Japan, June 4-7, 2024},
  pages        = {437--448},
  publisher    = {{ACM}},
  year         = {2024},
  url          = {https://doi.org/10.1145/3650200.3656636},
  doi          = {10.1145/3650200.3656636},
  timestamp    = {Wed, 16 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ics/HuangD0ZLHRZ0LC24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ipps/HuangD0ZZLLRZ0C24,
  author       = {Jiajun Huang and
                  Sheng Di and
                  Xiaodong Yu and
                  Yujia Zhai and
                  Zhaorui Zhang and
                  Jinyang Liu and
                  Xiaoyi Lu and
                  Ken Raffenetti and
                  Hui Zhou and
                  Kai Zhao and
                  Zizhong Chen and
                  Franck Cappello and
                  Yanfei Guo and
                  Rajeev Thakur},
  title        = {An Optimized Error-controlled {MPI} Collective Framework Integrated
                  with Lossy Compression},
  booktitle    = {{IEEE} International Parallel and Distributed Processing Symposium,
                  {IPDPS} 2024, San Francisco, CA, USA, May 27-31, 2024},
  pages        = {752--764},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/IPDPS57955.2024.00072},
  doi          = {10.1109/IPDPS57955.2024.00072},
  timestamp    = {Wed, 16 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ipps/HuangD0ZZLLRZ0C24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ppopp/HuangD0ZLHRZ0CC24,
  author       = {Jiajun Huang and
                  Sheng Di and
                  Xiaodong Yu and
                  Yujia Zhai and
                  Jinyang Liu and
                  Yafan Huang and
                  Ken Raffenetti and
                  Hui Zhou and
                  Kai Zhao and
                  Zizhong Chen and
                  Franck Cappello and
                  Yanfei Guo and
                  Rajeev Thakur},
  editor       = {Michel Steuwer and
                  I{-}Ting Angelina Lee and
                  Milind Chabbi},
  title        = {{POSTER:} Optimizing Collective Communications with Error-bounded
                  Lossy Compression for {GPU} Clusters},
  booktitle    = {Proceedings of the 29th {ACM} {SIGPLAN} Annual Symposium on Principles
                  and Practice of Parallel Programming, PPoPP 2024, Edinburgh, United
                  Kingdom, March 2-6, 2024},
  pages        = {454--456},
  publisher    = {{ACM}},
  year         = {2024},
  url          = {https://doi.org/10.1145/3627535.3638467},
  doi          = {10.1145/3627535.3638467},
  timestamp    = {Wed, 16 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ppopp/HuangD0ZLHRZ0CC24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/ZhouLRGT24,
  author       = {Hui Zhou and
                  Robert Latham and
                  Ken Raffenetti and
                  Yanfei Guo and
                  Rajeev Thakur},
  title        = {{MPI} Progress For All},
  booktitle    = {{SC24-W:} Workshops of the International Conference for High Performance
                  Computing, Networking, Storage and Analysis, Atlanta, GA, USA, November
                  17-22, 2024},
  pages        = {425--435},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/SCW63240.2024.00063},
  doi          = {10.1109/SCW63240.2024.00063},
  timestamp    = {Tue, 15 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sc/ZhouLRGT24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-2401-16547,
  author       = {Hui Zhou and
                  Ken Raffenetti and
                  Wesley Bland and
                  Yanfei Guo},
  title        = {Generating Bindings in {MPICH}},
  journal      = {CoRR},
  volume       = {abs/2401.16547},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2401.16547},
  doi          = {10.48550/ARXIV.2401.16547},
  eprinttype   = {arXiv},
  eprint       = {2401.16547},
  timestamp    = {Tue, 15 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2401-16547.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cluster/HuangOZLSRZHCGT23,
  author       = {Jiajun Huang and
                  Kaiming Ouyang and
                  Yujia Zhai and
                  Jinyang Liu and
                  Min Si and
                  Ken Raffenetti and
                  Hui Zhou and
                  Atsushi Hori and
                  Zizhong Chen and
                  Yanfei Guo and
                  Rajeev Thakur},
  title        = {{PiP-MColl:} Process-in-Process-based Multi-object {MPI} Collectives},
  booktitle    = {{IEEE} International Conference on Cluster Computing, {CLUSTER} 2023,
                  Santa Fe, NM, USA, October 31 - November 3, 2023},
  pages        = {354--364},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/CLUSTER52292.2023.00037},
  doi          = {10.1109/CLUSTER52292.2023.00037},
  timestamp    = {Wed, 16 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cluster/HuangOZLSRZHCGT23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/hpdc/HuangOZLSRZHCGT23,
  author       = {Jiajun Huang and
                  Kaiming Ouyang and
                  Yujia Zhai and
                  Jinyang Liu and
                  Min Si and
                  Ken Raffenetti and
                  Hui Zhou and
                  Atsushi Hori and
                  Zizhong Chen and
                  Yanfei Guo and
                  Rajeev Thakur},
  editor       = {Ali Raza Butt and
                  Ningfang Mi and
                  Kyle Chard},
  title        = {Accelerating {MPI} Collectives with Process-in-Process-based Multi-object
                  Techniques},
  booktitle    = {Proceedings of the 32nd International Symposium on High-Performance
                  Parallel and Distributed Computing, {HPDC} 2023, Orlando, FL, USA,
                  June 16-23, 2023},
  pages        = {333--334},
  publisher    = {{ACM}},
  year         = {2023},
  url          = {https://doi.org/10.1145/3588195.3595955},
  doi          = {10.1145/3588195.3595955},
  timestamp    = {Wed, 16 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/hpdc/HuangOZLSRZHCGT23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icpp/GillisRZGT23,
  author       = {Thomas Gillis and
                  Ken Raffenetti and
                  Hui Zhou and
                  Yanfei Guo and
                  Rajeev Thakur},
  title        = {Quantifying the Performance Benefits of Partitioned Communication
                  in {MPI}},
  booktitle    = {Proceedings of the 52nd International Conference on Parallel Processing,
                  {ICPP} 2023, Salt Lake City, UT, USA, August 7-10, 2023},
  pages        = {285--294},
  publisher    = {{ACM}},
  year         = {2023},
  url          = {https://doi.org/10.1145/3605573.3605599},
  doi          = {10.1145/3605573.3605599},
  timestamp    = {Tue, 15 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icpp/GillisRZGT23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/ZhouRZGT23,
  author       = {Hui Zhou and
                  Ken Raffenetti and
                  Junchao Zhang and
                  Yanfei Guo and
                  Rajeev Thakur},
  title        = {Frustrated With {MPI+Threads}? Try {MPIxThreads}!},
  booktitle    = {Proceedings of the 30th European {MPI} Users' Group Meeting, EuroMPI
                  2023, Bristol, United Kingdom, September 11-13, 2023},
  pages        = {2:1--2:10},
  publisher    = {{ACM}},
  year         = {2023},
  url          = {https://doi.org/10.1145/3615318.3615320},
  doi          = {10.1145/3615318.3615320},
  timestamp    = {Tue, 15 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/ZhouRZGT23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/ZhouRGT22,
  author       = {Hui Zhou and
                  Ken Raffenetti and
                  Yanfei Guo and
                  Rajeev Thakur},
  title        = {{MPIX} Stream: An Explicit Solution to Hybrid {MPI+X} Programming},
  booktitle    = {EuroMPI/USA'22: 29th European {MPI} Users' Group Meeting, Chattanooga,
                  TN, USA, September 26 - 28, 2022},
  pages        = {1--10},
  publisher    = {{ACM}},
  year         = {2022},
  url          = {https://doi.org/10.1145/3555819.3555820},
  doi          = {10.1145/3555819.3555820},
  timestamp    = {Tue, 15 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/ZhouRGT22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ics/AmerABCC0GGHIRS19,
  author       = {Abdelhalim Amer and
                  Charles Archer and
                  Michael Blocksome and
                  Chongxiao Cao and
                  Michael Chuvelev and
                  Hajime Fujita and
                  Maria Garzaran and
                  Yanfei Guo and
                  Jeff R. Hammond and
                  Shintaro Iwasaki and
                  Kenneth J. Raffenetti and
                  Mikhail Shiryaev and
                  Min Si and
                  Kenjiro Taura and
                  Sagar Thapaliya and
                  Pavan Balaji},
  editor       = {Rudolf Eigenmann and
                  Chen Ding and
                  Sally A. McKee},
  title        = {Software combining to mitigate multithreaded {MPI} contention},
  booktitle    = {Proceedings of the {ACM} International Conference on Supercomputing,
                  {ICS} 2019, Phoenix, AZ, USA, June 26-28, 2019},
  pages        = {367--379},
  publisher    = {{ACM}},
  year         = {2019},
  url          = {https://doi.org/10.1145/3330345.3330378},
  doi          = {10.1145/3330345.3330378},
  timestamp    = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ics/AmerABCC0GGHIRS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ipps/GuoABPBRB17,
  author       = {Yanfei Guo and
                  Charles J. Archer and
                  Michael Blocksome and
                  Scott Parker and
                  Wesley Bland and
                  Ken Raffenetti and
                  Pavan Balaji},
  title        = {Memory Compression Techniques for Network Address Management in {MPI}},
  booktitle    = {2017 {IEEE} International Parallel and Distributed Processing Symposium,
                  {IPDPS} 2017, Orlando, FL, USA, May 29 - June 2, 2017},
  pages        = {1008--1017},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/IPDPS.2017.18},
  doi          = {10.1109/IPDPS.2017.18},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/GuoABPBRB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/RaffenettiAOAB017,
  author       = {Ken Raffenetti and
                  Abdelhalim Amer and
                  Lena Oden and
                  Charles Archer and
                  Wesley Bland and
                  Hajime Fujita and
                  Yanfei Guo and
                  Tomislav Janjusic and
                  Dmitry Durnov and
                  Michael Blocksome and
                  Min Si and
                  Sangmin Seo and
                  Akhil Langer and
                  Gengbin Zheng and
                  Masamichi Takagi and
                  Paul K. Coffman and
                  Jithin Jose and
                  Sayantan Sur and
                  Alexander Sannikov and
                  Sergey Oblomov and
                  Michael Chuvelev and
                  Masayuki Hatanaka and
                  Xin Zhao and
                  Paul F. Fischer and
                  Thilina Rathnayake and
                  Matthew Otten and
                  Misun Min and
                  Pavan Balaji},
  editor       = {Bernd Mohr and
                  Padma Raghavan},
  title        = {Why is {MPI} so slow?: analyzing the fundamental limits in implementing
                  {MPI-3.1}},
  booktitle    = {Proceedings of the International Conference for High Performance Computing,
                  Networking, Storage and Analysis, {SC} 2017, Denver, CO, USA, November
                  12 - 17, 2017},
  pages        = {62},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {https://doi.org/10.1145/3126908.3126963},
  doi          = {10.1145/3126908.3126963},
  timestamp    = {Tue, 07 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sc/RaffenettiAOAB017.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ccgrid/RaffenettiPB15,
  author       = {Ken Raffenetti and
                  Antonio J. Pe{\~{n}}a and
                  Pavan Balaji},
  title        = {Toward Implementing Robust Support for {Portals} 4 Networks in {MPICH}},
  booktitle    = {15th {IEEE/ACM} International Symposium on Cluster, Cloud and Grid
                  Computing, CCGrid 2015, Shenzhen, China, May 4-7, 2015},
  pages        = {1173--1176},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/CCGrid.2015.79},
  doi          = {10.1109/CCGRID.2015.79},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ccgrid/RaffenettiPB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/ZhangLRB14,
  author       = {Junchao Zhang and
                  Bill Long and
                  Kenneth Raffenetti and
                  Pavan Balaji},
  editor       = {Jack J. Dongarra and
                  Yutaka Ishikawa and
                  Atsushi Hori},
  title        = {Implementing the {MPI-3.0} {Fortran} 2008 Binding},
  booktitle    = {21st European {MPI} Users' Group Meeting, EuroMPI/ASIA '14, Kyoto,
                  Japan - September 09 - 12, 2014},
  pages        = {1},
  publisher    = {{ACM}},
  year         = {2014},
  url          = {https://doi.org/10.1145/2642769.2642777},
  doi          = {10.1145/2642769.2642777},
  timestamp    = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pvm/ZhangLRB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/BlandRB14,
  author       = {Wesley Bland and
                  Kenneth Raffenetti and
                  Pavan Balaji},
  title        = {Simplifying the recovery model of user-level failure mitigation},
  booktitle    = {Proceedings of the 2014 Workshop on Exascale MPI, ExaMPI '14, New
                  Orleans, Louisiana, USA, November 16-21, 2014},
  pages        = {20--25},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ExaMPI.2014.4},
  doi          = {10.1109/EXAMPI.2014.4},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/BlandRB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cluster/WilkinsGTDH22,
  author       = {Michael Wilkins and
                  Yanfei Guo and
                  Rajeev Thakur and
                  Peter A. Dinda and
                  Nikos Hardavellas},
  title        = {{ACCLAiM:} Advancing the Practicality of {MPI} Collective Communication
                  Autotuning Using Machine Learning},
  booktitle    = {{IEEE} International Conference on Cluster Computing, {CLUSTER} 2022,
                  Heidelberg, Germany, September 5-8, 2022},
  pages        = {161--171},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/CLUSTER51413.2022.00030},
  doi          = {10.1109/CLUSTER51413.2022.00030},
  timestamp    = {Tue, 07 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cluster/WilkinsGTDH22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/jocs/GroppTB21,
  author       = {William Gropp and
                  Rajeev Thakur and
                  Pavan Balaji},
  title        = {Translational research in the {MPICH} project},
  journal      = {J. Comput. Sci.},
  volume       = {52},
  pages        = {101203},
  year         = {2021},
  url          = {https://doi.org/10.1016/j.jocs.2020.101203},
  doi          = {10.1016/J.JOCS.2020.101203},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jocs/GroppTB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@proceedings{DBLP:conf/pvm/2017,
  editor       = {Antonio J. Pe{\~{n}}a and
                  Pavan Balaji and
                  William Gropp and
                  Rajeev Thakur},
  title        = {Proceedings of the 24th European {MPI} Users' Group Meeting, EuroMPI/USA
                  2017, Chicago, IL, USA, September 25-28, 2017},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {https://dl.acm.org/citation.cfm?id=3127024},
  isbn         = {978-1-4503-4849-2},
  timestamp    = {Thu, 24 Aug 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/2017.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/concurrency/DinanBBGGT16,
  author       = {James Dinan and
                  Pavan Balaji and
                  Darius Buntinas and
                  David Goodell and
                  William Gropp and
                  Rajeev Thakur},
  title        = {An implementation and evaluation of the {MPI} 3.0 one-sided communication
                  interface},
  journal      = {Concurr. Comput. Pract. Exp.},
  volume       = {28},
  number       = {17},
  pages        = {4385--4404},
  year         = {2016},
  url          = {https://doi.org/10.1002/cpe.3758},
  doi          = {10.1002/CPE.3758},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/concurrency/DinanBBGGT16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tpds/AjiPJMCBBDFMMT16,
  author       = {Ashwin M. Aji and
                  Lokendra S. Panwar and
                  Feng Ji and
                  Karthik Murthy and
                  Milind Chabbi and
                  Pavan Balaji and
                  Keith R. Bisset and
                  James Dinan and
                  Wu{-}chun Feng and
                  John M. Mellor{-}Crummey and
                  Xiaosong Ma and
                  Rajeev Thakur},
  title        = {{MPI-ACC:} Accelerator-Aware {MPI} for Scientific Applications},
  journal      = {{IEEE} Trans. Parallel Distributed Syst.},
  volume       = {27},
  number       = {5},
  pages        = {1401--1414},
  year         = {2016},
  url          = {https://doi.org/10.1109/TPDS.2015.2446479},
  doi          = {10.1109/TPDS.2015.2446479},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tpds/AjiPJMCBBDFMMT16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/topc/HoeflerDTBBGU15,
  author       = {Torsten Hoefler and
                  James Dinan and
                  Rajeev Thakur and
                  Brian Barrett and
                  Pavan Balaji and
                  William Gropp and
                  Keith D. Underwood},
  title        = {Remote Memory Access Programming in {MPI-3}},
  journal      = {{ACM} Trans. Parallel Comput.},
  volume       = {2},
  number       = {2},
  pages        = {9:1--9:26},
  year         = {2015},
  url          = {https://doi.org/10.1145/2780584},
  doi          = {10.1145/2780584},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/topc/HoeflerDTBBGU15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ijhpca/DinanGBGMST14,
  author       = {James Dinan and
                  Ryan E. Grant and
                  Pavan Balaji and
                  David Goodell and
                  Douglas Miller and
                  Marc Snir and
                  Rajeev Thakur},
  title        = {Enabling communication concurrency through flexible {MPI} endpoints},
  journal      = {Int. J. High Perform. Comput. Appl.},
  volume       = {28},
  number       = {4},
  pages        = {390--405},
  year         = {2014},
  url          = {https://doi.org/10.1177/1094342014548772},
  doi          = {10.1177/1094342014548772},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijhpca/DinanGBGMST14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tpds/JenkinsDBPST14,
  author       = {John Jenkins and
                  James Dinan and
                  Pavan Balaji and
                  Tom Peterka and
                  Nagiza F. Samatova and
                  Rajeev Thakur},
  title        = {Processing {MPI} Derived Datatypes on Noncontiguous {GPU}-Resident Data},
  journal      = {{IEEE} Trans. Parallel Distributed Syst.},
  volume       = {25},
  number       = {10},
  pages        = {2627--2637},
  year         = {2014},
  url          = {https://doi.org/10.1109/TPDS.2013.234},
  doi          = {10.1109/TPDS.2013.234},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tpds/JenkinsDBPST14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/computing/HoeflerDBBBBGKT13,
  author       = {Torsten Hoefler and
                  James Dinan and
                  Darius Buntinas and
                  Pavan Balaji and
                  Brian Barrett and
                  Ron Brightwell and
                  William Gropp and
                  Vivek Kale and
                  Rajeev Thakur},
  title        = {{MPI} + {MPI:} a new hybrid approach to parallel programming with
                  {MPI} plus shared memory},
  journal      = {Computing},
  volume       = {95},
  number       = {12},
  pages        = {1121--1136},
  year         = {2013},
  url          = {https://doi.org/10.1007/s00607-013-0324-2},
  doi          = {10.1007/S00607-013-0324-2},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/computing/HoeflerDBBBBGKT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ccgrid/ZhaoBZDGBTAG13,
  author       = {Xin Zhao and
                  Darius Buntinas and
                  Judicael A. Zounmevo and
                  James Dinan and
                  David Goodell and
                  Pavan Balaji and
                  Rajeev Thakur and
                  Ahmad Afsahi and
                  William Gropp},
  title        = {Toward Asynchronous and {MPI}-Interoperable Active Messages},
  booktitle    = {13th {IEEE/ACM} International Symposium on Cluster, Cloud, and Grid
                  Computing, CCGrid 2013, Delft, Netherlands, May 13-16, 2013},
  pages        = {87--94},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/CCGrid.2013.84},
  doi          = {10.1109/CCGRID.2013.84},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ccgrid/ZhaoBZDGBTAG13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/dasc/ZhaoBGT13,
  author       = {Xin Zhao and
                  Pavan Balaji and
                  William Gropp and
                  Rajeev Thakur},
  title        = {Optimization Strategies for {MPI}-Interoperable Active Messages},
  booktitle    = {{IEEE} 11th International Conference on Dependable, Autonomic and
                  Secure Computing, {DASC} 2013, Chengdu, China, December 21-22, 2013},
  pages        = {508--515},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/DASC.2013.116},
  doi          = {10.1109/DASC.2013.116},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/dasc/ZhaoBGT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/hpdc/AjiPJCMBBDFMMT13,
  author       = {Ashwin M. Aji and
                  Lokendra S. Panwar and
                  Feng Ji and
                  Milind Chabbi and
                  Karthik Murthy and
                  Pavan Balaji and
                  Keith R. Bisset and
                  James Dinan and
                  Wu{-}chun Feng and
                  John M. Mellor{-}Crummey and
                  Xiaosong Ma and
                  Rajeev Thakur},
  editor       = {Manish Parashar and
                  Jon B. Weissman and
                  Dick H. J. Epema and
                  Renato J. O. Figueiredo},
  title        = {On the efficacy of {GPU}-integrated {MPI} for scientific applications},
  booktitle    = {The 22nd International Symposium on High-Performance Parallel and
                  Distributed Computing, HPDC'13, New York, NY, {USA} - June 17 - 21,
                  2013},
  pages        = {191--202},
  publisher    = {{ACM}},
  year         = {2013},
  url          = {https://dl.acm.org/citation.cfm?id=2462915},
  timestamp    = {Mon, 26 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/hpdc/AjiPJCMBBDFMMT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icpads/ZhaoBGT13,
  author       = {Xin Zhao and
                  Pavan Balaji and
                  William Gropp and
                  Rajeev Thakur},
  title        = {{MPI}-Interoperable Generalized Active Messages},
  booktitle    = {19th {IEEE} International Conference on Parallel and Distributed Systems,
                  {ICPADS} 2013, Seoul, Korea, December 15-18, 2013},
  pages        = {200--207},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICPADS.2013.38},
  doi          = {10.1109/ICPADS.2013.38},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icpads/ZhaoBGT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ipps/AjiBDFT13,
  author       = {Ashwin M. Aji and
                  Pavan Balaji and
                  James Dinan and
                  Wu{-}chun Feng and
                  Rajeev Thakur},
  title        = {Synchronization and Ordering Semantics in Hybrid {MPI+GPU} Programming},
  booktitle    = {2013 {IEEE} International Symposium on Parallel {\&} Distributed Processing,
                  Workshops and {PhD} Forum, Cambridge, MA, USA, May 20-24, 2013},
  pages        = {1020--1029},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/IPDPSW.2013.256},
  doi          = {10.1109/IPDPSW.2013.256},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/AjiBDFT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/DinanBGMST13,
  author       = {James Dinan and
                  Pavan Balaji and
                  David Goodell and
                  Douglas Miller and
                  Marc Snir and
                  Rajeev Thakur},
  editor       = {Jack J. Dongarra and
                  Javier Garc{\'{\i}}a Blas and
                  Jes{\'{u}}s Carretero},
  title        = {Enabling {MPI} interoperability through flexible communication endpoints},
  booktitle    = {20th European {MPI} Users' Group Meeting, EuroMPI '13, Madrid, Spain
                  - September 15 - 18, 2013},
  pages        = {13--18},
  publisher    = {{ACM}},
  year         = {2013},
  url          = {https://doi.org/10.1145/2488551.2488553},
  doi          = {10.1145/2488551.2488553},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/DinanBGMST13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/PenaCDBTG13,
  author       = {Antonio J. Pe{\~{n}}a and
                  Ralf G. Correa Carvalho and
                  James Dinan and
                  Pavan Balaji and
                  Rajeev Thakur and
                  William Gropp},
  editor       = {Jack J. Dongarra and
                  Javier Garc{\'{\i}}a Blas and
                  Jes{\'{u}}s Carretero},
  title        = {Analysis of topology-dependent {MPI} performance on {Gemini} networks},
  booktitle    = {20th European {MPI} Users' Group Meeting, EuroMPI '13, Madrid, Spain
                  - September 15 - 18, 2013},
  pages        = {61--66},
  publisher    = {{ACM}},
  year         = {2013},
  url          = {https://doi.org/10.1145/2488551.2488564},
  doi          = {10.1145/2488551.2488564},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/PenaCDBTG13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cluster/JenkinsDBST12,
  author       = {John Jenkins and
                  James Dinan and
                  Pavan Balaji and
                  Nagiza F. Samatova and
                  Rajeev Thakur},
  title        = {Enabling Fast, Noncontiguous {GPU} Data Movement in Hybrid {MPI+GPU}
                  Environments},
  booktitle    = {2012 {IEEE} International Conference on Cluster Computing, {CLUSTER}
                  2012, Beijing, China, September 24-28, 2012},
  pages        = {468--476},
  publisher    = {{IEEE} Computer Society},
  year         = {2012},
  url          = {https://doi.org/10.1109/CLUSTER.2012.72},
  doi          = {10.1109/CLUSTER.2012.72},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cluster/JenkinsDBST12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/hpcc/AjiDBBFBT12,
  author       = {Ashwin M. Aji and
                  James Dinan and
                  Darius Buntinas and
                  Pavan Balaji and
                  Wu{-}chun Feng and
                  Keith R. Bisset and
                  Rajeev Thakur},
  editor       = {Geyong Min and
                  Jia Hu and
                  Lei (Chris) Liu and
                  Laurence Tianruo Yang and
                  Seetharami Seelam and
                  Laurent Lef{\`{e}}vre},
  title        = {{MPI-ACC:} An Integrated and Extensible Approach to Data Movement
                  in Accelerator-based Systems},
  booktitle    = {14th {IEEE} International Conference on High Performance Computing
                  and Communication {\&} 9th {IEEE} International Conference on Embedded
                  Software and Systems, {HPCC-ICESS} 2012, Liverpool, United Kingdom,
                  June 25-27, 2012},
  pages        = {647--654},
  publisher    = {{IEEE} Computer Society},
  year         = {2012},
  url          = {https://doi.org/10.1109/HPCC.2012.92},
  doi          = {10.1109/HPCC.2012.92},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/hpcc/AjiDBBFBT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/DinanGGTB12,
  author       = {James Dinan and
                  David Goodell and
                  William Gropp and
                  Rajeev Thakur and
                  Pavan Balaji},
  editor       = {Jesper Larsson Tr{\"{a}}ff and
                  Siegfried Benkner and
                  Jack J. Dongarra},
  title        = {Efficient Multithreaded Context {ID} Allocation in {MPI}},
  booktitle    = {Recent Advances in the Message Passing Interface - 19th European {MPI}
                  Users' Group Meeting, EuroMPI 2012, Vienna, Austria, September 23-26,
                  2012. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {7490},
  pages        = {57--66},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-33518-1\_11},
  doi          = {10.1007/978-3-642-33518-1\_11},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/DinanGGTB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/GroppLT12,
  author       = {William Gropp and
                  Ewing L. Lusk and
                  Rajeev Thakur},
  editor       = {Jesper Larsson Tr{\"{a}}ff and
                  Siegfried Benkner and
                  Jack J. Dongarra},
  title        = {Advanced {MPI} Including New {MPI-3} Features},
  booktitle    = {Recent Advances in the Message Passing Interface - 19th European {MPI}
                  Users' Group Meeting, EuroMPI 2012, Vienna, Austria, September 23-26,
                  2012. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {7490},
  pages        = {14},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-33518-1\_5},
  doi          = {10.1007/978-3-642-33518-1\_5},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/GroppLT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/HoeflerDBBBBGKT12,
  author       = {Torsten Hoefler and
                  James Dinan and
                  Darius Buntinas and
                  Pavan Balaji and
                  Brian W. Barrett and
                  Ron Brightwell and
                  William Gropp and
                  Vivek Kale and
                  Rajeev Thakur},
  editor       = {Jesper Larsson Tr{\"{a}}ff and
                  Siegfried Benkner and
                  Jack J. Dongarra},
  title        = {Leveraging {MPI}'s One-Sided Communication Interface for Shared-Memory
                  Programming},
  booktitle    = {Recent Advances in the Message Passing Interface - 19th European {MPI}
                  Users' Group Meeting, EuroMPI 2012, Vienna, Austria, September 23-26,
                  2012. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {7490},
  pages        = {132--141},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-33518-1\_18},
  doi          = {10.1007/978-3-642-33518-1\_18},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/HoeflerDBBBBGKT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/cacm/GopalakrishnanKSTGLSSB11,
  author       = {Ganesh Gopalakrishnan and
                  Robert M. Kirby and
                  Stephen F. Siegel and
                  Rajeev Thakur and
                  William Gropp and
                  Ewing L. Lusk and
                  Bronis R. de Supinski and
                  Martin Schulz and
                  Greg Bronevetsky},
  title        = {Formal analysis of {MPI}-based parallel programs},
  journal      = {Commun. {ACM}},
  volume       = {54},
  number       = {12},
  pages        = {82--91},
  year         = {2011},
  url          = {https://doi.org/10.1145/2043174.2043194},
  doi          = {10.1145/2043174.2043194},
  timestamp    = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/cacm/GopalakrishnanKSTGLSSB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/concurrency/HoeflerRRSTT11,
  author       = {Torsten Hoefler and
                  Rolf Rabenseifner and
                  Hubert Ritzdorf and
                  Bronis R. de Supinski and
                  Rajeev Thakur and
                  Jesper Larsson Tr{\"{a}}ff},
  title        = {The scalable process topology interface of {MPI} 2.2},
  journal      = {Concurr. Comput. Pract. Exp.},
  volume       = {23},
  number       = {4},
  pages        = {293--310},
  year         = {2011},
  url          = {https://doi.org/10.1002/cpe.1643},
  doi          = {10.1002/CPE.1643},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/concurrency/HoeflerRRSTT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ppl/BalajiBGGHKLTT11,
  author       = {Pavan Balaji and
                  Darius Buntinas and
                  David Goodell and
                  William Gropp and
                  Torsten Hoefler and
                  Sameer Kumar and
                  Ewing L. Lusk and
                  Rajeev Thakur and
                  Jesper Larsson Tr{\"{a}}ff},
  title        = {{MPI} on Millions of Cores},
  journal      = {Parallel Process. Lett.},
  volume       = {21},
  number       = {1},
  pages        = {45--60},
  year         = {2011},
  url          = {https://doi.org/10.1142/S0129626411000060},
  doi          = {10.1142/S0129626411000060},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ppl/BalajiBGGHKLTT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/GoodellGZT11,
  author       = {David Goodell and
                  William Gropp and
                  Xin Zhao and
                  Rajeev Thakur},
  editor       = {Yiannis Cotronis and
                  Anthony Danalis and
                  Dimitrios S. Nikolopoulos and
                  Jack J. Dongarra},
  title        = {Scalable Memory Use in {MPI:} {A} Case Study with {MPICH2}},
  booktitle    = {Recent Advances in the Message Passing Interface - 18th European {MPI}
                  Users' Group Meeting, EuroMPI 2011, Santorini, Greece, September 18-21,
                  2011. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {6960},
  pages        = {140--149},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-24449-0\_17},
  doi          = {10.1007/978-3-642-24449-0\_17},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/GoodellGZT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/GroppHTT11,
  author       = {William Gropp and
                  Torsten Hoefler and
                  Rajeev Thakur and
                  Jesper Larsson Tr{\"{a}}ff},
  editor       = {Yiannis Cotronis and
                  Anthony Danalis and
                  Dimitrios S. Nikolopoulos and
                  Jack J. Dongarra},
  title        = {Performance Expectations and Guidelines for {MPI} Derived Datatypes},
  booktitle    = {Recent Advances in the Message Passing Interface - 18th European {MPI}
                  Users' Group Meeting, EuroMPI 2011, Santorini, Greece, September 18-21,
                  2011. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {6960},
  pages        = {150--159},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-24449-0\_18},
  doi          = {10.1007/978-3-642-24449-0\_18},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/GroppHTT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ijhpca/BalajiBGGT10,
  author       = {Pavan Balaji and
                  Darius Buntinas and
                  David Goodell and
                  William Gropp and
                  Rajeev Thakur},
  title        = {Fine-Grained Multithreading Support for Hybrid Threaded {MPI} Programming},
  journal      = {Int. J. High Perform. Comput. Appl.},
  volume       = {24},
  number       = {1},
  pages        = {49--57},
  year         = {2010},
  url          = {https://doi.org/10.1177/1094342009360206},
  doi          = {10.1177/1094342009360206},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ijhpca/BalajiBGGT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ijhpca/BalajiCGTL10,
  author       = {Pavan Balaji and
                  Anthony Chan and
                  William Gropp and
                  Rajeev Thakur and
                  Ewing L. Lusk},
  title        = {The Importance of Non-Data-Communication Overheads in {MPI}},
  journal      = {Int. J. High Perform. Comput. Appl.},
  volume       = {24},
  number       = {1},
  pages        = {5--15},
  year         = {2010},
  url          = {https://doi.org/10.1177/1094342009359258},
  doi          = {10.1177/1094342009359258},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ijhpca/BalajiCGTL10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/spe/PervezGKTG10,
  author       = {Salman Pervez and
                  Ganesh Gopalakrishnan and
                  Robert M. Kirby and
                  Rajeev Thakur and
                  William Gropp},
  title        = {Formal methods applied to high-performance computing software design:
                  a case study of {MPI} one-sided communication-based locking},
  journal      = {Softw. Pract. Exp.},
  volume       = {40},
  number       = {1},
  pages        = {23--43},
  year         = {2010},
  url          = {https://doi.org/10.1002/spe.946},
  doi          = {10.1002/SPE.946},
  timestamp    = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/spe/PervezGKTG10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tpds/TraffGT10,
  author       = {Jesper Larsson Tr{\"{a}}ff and
                  William D. Gropp and
                  Rajeev Thakur},
  title        = {Self-Consistent {MPI} Performance Guidelines},
  journal      = {{IEEE} Trans. Parallel Distributed Syst.},
  volume       = {21},
  number       = {5},
  pages        = {698--709},
  year         = {2010},
  url          = {https://doi.org/10.1109/TPDS.2009.120},
  doi          = {10.1109/TPDS.2009.120},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tpds/TraffGT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cf/DinanBLST10,
  author       = {James Dinan and
                  Pavan Balaji and
                  Ewing L. Lusk and
                  P. Sadayappan and
                  Rajeev Thakur},
  editor       = {Nancy M. Amato and
                  Hubertus Franke and
                  Paul H. J. Kelly},
  title        = {Hybrid parallel programming with {MPI} and {Unified Parallel C}},
  booktitle    = {Proceedings of the 7th Conference on Computing Frontiers, 2010, Bertinoro,
                  Italy, May 17-19, 2010},
  pages        = {177--186},
  publisher    = {{ACM}},
  year         = {2010},
  url          = {https://doi.org/10.1145/1787275.1787323},
  doi          = {10.1145/1787275.1787323},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cf/DinanBLST10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cluster/GoodellBBDGKST10,
  author       = {David Goodell and
                  Pavan Balaji and
                  Darius Buntinas and
                  G{\'{a}}bor D{\'{o}}zsa and
                  William Gropp and
                  Sameer Kumar and
                  Bronis R. de Supinski and
                  Rajeev Thakur},
  title        = {Minimizing {MPI} Resource Contention in Multithreaded Multicore Environments},
  booktitle    = {Proceedings of the 2010 {IEEE} International Conference on Cluster
                  Computing, Heraklion, Crete, Greece, 20-24 September, 2010},
  pages        = {1--8},
  publisher    = {{IEEE} Computer Society},
  year         = {2010},
  url          = {https://doi.org/10.1109/CLUSTER.2010.11},
  doi          = {10.1109/CLUSTER.2010.11},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cluster/GoodellBBDGKST10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/DozsaKBBGGRT10,
  author       = {G{\'{a}}bor D{\'{o}}zsa and
                  Sameer Kumar and
                  Pavan Balaji and
                  Darius Buntinas and
                  David Goodell and
                  William Gropp and
                  Joe Ratterman and
                  Rajeev Thakur},
  editor       = {Rainer Keller and
                  Edgar Gabriel and
                  Michael M. Resch and
                  Jack J. Dongarra},
  title        = {Enabling Concurrent Multithreaded {MPI} Communication on Multicore
                  Petascale Systems},
  booktitle    = {Recent Advances in the Message Passing Interface - 17th European {MPI}
                  Users' Group Meeting, EuroMPI 2010, Stuttgart, Germany, September
                  12-15, 2010. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {6305},
  pages        = {11--20},
  publisher    = {Springer},
  year         = {2010},
  url          = {https://doi.org/10.1007/978-3-642-15646-5\_2},
  doi          = {10.1007/978-3-642-15646-5\_2},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/DozsaKBBGGRT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/HoeflerGTT10,
  author       = {Torsten Hoefler and
                  William Gropp and
                  Rajeev Thakur and
                  Jesper Larsson Tr{\"{a}}ff},
  editor       = {Rainer Keller and
                  Edgar Gabriel and
                  Michael M. Resch and
                  Jack J. Dongarra},
  title        = {Toward Performance Models of {MPI} Implementations for Understanding
                  Application Scaling Issues},
  booktitle    = {Recent Advances in the Message Passing Interface - 17th European {MPI}
                  Users' Group Meeting, EuroMPI 2010, Stuttgart, Germany, September
                  12-15, 2010. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {6305},
  pages        = {21--30},
  publisher    = {Springer},
  year         = {2010},
  url          = {https://doi.org/10.1007/978-3-642-15646-5\_3},
  doi          = {10.1007/978-3-642-15646-5\_3},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/HoeflerGTT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/KrishnaBLTT10,
  author       = {Jayesh Krishna and
                  Pavan Balaji and
                  Ewing L. Lusk and
                  Rajeev Thakur and
                  Fabian Tiller},
  editor       = {Rainer Keller and
                  Edgar Gabriel and
                  Michael M. Resch and
                  Jack J. Dongarra},
  title        = {Implementing {MPI} on {Windows}: Comparison with Common Approaches on
                  {Unix}},
  booktitle    = {Recent Advances in the Message Passing Interface - 17th European {MPI}
                  Users' Group Meeting, EuroMPI 2010, Stuttgart, Germany, September
                  12-15, 2010. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {6305},
  pages        = {160--169},
  publisher    = {Springer},
  year         = {2010},
  url          = {https://doi.org/10.1007/978-3-642-15646-5\_17},
  doi          = {10.1007/978-3-642-15646-5\_17},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/KrishnaBLTT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ife/BalajiCTGL09,
  author       = {Pavan Balaji and
                  Anthony Chan and
                  Rajeev Thakur and
                  William Gropp and
                  Ewing L. Lusk},
  title        = {Toward message passing for a million processes: characterizing {MPI}
                  on a massive scale {Blue Gene/P}},
  journal      = {Comput. Sci. Res. Dev.},
  volume       = {24},
  number       = {1-2},
  pages        = {11--19},
  year         = {2009},
  url          = {https://doi.org/10.1007/s00450-009-0095-3},
  doi          = {10.1007/S00450-009-0095-3},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ife/BalajiCTGL09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/pc/ThakurG09,
  author       = {Rajeev Thakur and
                  William Gropp},
  title        = {Test suite for evaluating performance of multithreaded {MPI} communication},
  journal      = {Parallel Comput.},
  volume       = {35},
  number       = {12},
  pages        = {608--617},
  year         = {2009},
  url          = {https://doi.org/10.1016/j.parco.2008.12.013},
  doi          = {10.1016/J.PARCO.2008.12.013},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pc/ThakurG09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icpp/TipparajuGRTT09,
  author       = {Vinod Tipparaju and
                  William Gropp and
                  Hubert Ritzdorf and
                  Rajeev Thakur and
                  Jesper Larsson Tr{\"{a}}ff},
  title        = {Investigating High Performance {RMA} Interfaces for the {MPI-3} Standard},
  booktitle    = {{ICPP} 2009, International Conference on Parallel Processing, Vienna,
                  Austria, 22-25 September 2009},
  pages        = {293--300},
  publisher    = {{IEEE} Computer Society},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICPP.2009.54},
  doi          = {10.1109/ICPP.2009.54},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icpp/TipparajuGRTT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ppopp/VoVDGKT09,
  author       = {Anh Vo and
                  Sarvani S. Vakkalanka and
                  Michael Delisi and
                  Ganesh Gopalakrishnan and
                  Robert M. Kirby and
                  Rajeev Thakur},
  editor       = {Daniel A. Reed and
                  Vivek Sarkar},
  title        = {Formal verification of practical {MPI} programs},
  booktitle    = {Proceedings of the 14th {ACM} {SIGPLAN} Symposium on Principles and
                  Practice of Parallel Programming, {PPOPP} 2009, Raleigh, NC, USA,
                  February 14-18, 2009},
  pages        = {261--270},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1504176.1504214},
  doi          = {10.1145/1504176.1504214},
  timestamp    = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ppopp/VoVDGKT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/AananthakrishnanDVVGKT09,
  author       = {Sriram Aananthakrishnan and
                  Michael Delisi and
                  Sarvani S. Vakkalanka and
                  Anh Vo and
                  Ganesh Gopalakrishnan and
                  Robert M. Kirby and
                  Rajeev Thakur},
  editor       = {Matti Ropo and
                  Jan Westerholm and
                  Jack J. Dongarra},
  title        = {How Formal Dynamic Verification Tools Facilitate Novel Concurrency
                  Visualizations},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  16th European {PVM/MPI} Users' Group Meeting, Espoo, Finland, September
                  7-10, 2009. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5759},
  pages        = {261--270},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-03770-2\_32},
  doi          = {10.1007/978-3-642-03770-2\_32},
  timestamp    = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pvm/AananthakrishnanDVVGKT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/BalajiBGGKLTT09,
  author       = {Pavan Balaji and
                  Darius Buntinas and
                  David Goodell and
                  William Gropp and
                  Sameer Kumar and
                  Ewing L. Lusk and
                  Rajeev Thakur and
                  Jesper Larsson Tr{\"{a}}ff},
  editor       = {Matti Ropo and
                  Jan Westerholm and
                  Jack J. Dongarra},
  title        = {{MPI} on a Million Processors},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  16th European {PVM/MPI} Users' Group Meeting, Espoo, Finland, September
                  7-10, 2009. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5759},
  pages        = {20--30},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-03770-2\_9},
  doi          = {10.1007/978-3-642-03770-2\_9},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pvm/BalajiBGGKLTT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/RossLGLT09,
  author       = {Robert B. Ross and
                  Robert Latham and
                  William Gropp and
                  Ewing L. Lusk and
                  Rajeev Thakur},
  editor       = {Matti Ropo and
                  Jan Westerholm and
                  Jack J. Dongarra},
  title        = {Processing {MPI} Datatypes Outside {MPI}},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  16th European {PVM/MPI} Users' Group Meeting, Espoo, Finland, September
                  7-10, 2009. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5759},
  pages        = {42--53},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-03770-2\_11},
  doi          = {10.1007/978-3-642-03770-2\_11},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pvm/RossLGLT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/SehrishWT09,
  author       = {Saba Sehrish and
                  Jun Wang and
                  Rajeev Thakur},
  editor       = {Matti Ropo and
                  Jan Westerholm and
                  Jack J. Dongarra},
  title        = {Conflict Detection Algorithm to Minimize Locking for {MPI-IO} Atomicity},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  16th European {PVM/MPI} Users' Group Meeting, Espoo, Finland, September
                  7-10, 2009. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5759},
  pages        = {143--153},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-03770-2\_21},
  doi          = {10.1007/978-3-642-03770-2\_21},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/SehrishWT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/VakkalankaSVGKT09,
  author       = {Sarvani S. Vakkalanka and
                  Grzegorz Szubzda and
                  Anh Vo and
                  Ganesh Gopalakrishnan and
                  Robert M. Kirby and
                  Rajeev Thakur},
  editor       = {Matti Ropo and
                  Jan Westerholm and
                  Jack J. Dongarra},
  title        = {Static-Analysis Assisted Dynamic Verification of {MPI} {Waitany} Programs
                  (Poster Abstract)},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  16th European {PVM/MPI} Users' Group Meeting, Espoo, Finland, September
                  7-10, 2009. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5759},
  pages        = {329--330},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-03770-2\_43},
  doi          = {10.1007/978-3-642-03770-2\_43},
  timestamp    = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pvm/VakkalankaSVGKT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/VoVWGKT09,
  author       = {Anh Vo and
                  Sarvani S. Vakkalanka and
                  Jason Williams and
                  Ganesh Gopalakrishnan and
                  Robert M. Kirby and
                  Rajeev Thakur},
  editor       = {Matti Ropo and
                  Jan Westerholm and
                  Jack J. Dongarra},
  title        = {Sound and Efficient Dynamic Verification of {MPI} Programs with Probe
                  Non-determinism},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  16th European {PVM/MPI} Users' Group Meeting, Espoo, Finland, September
                  7-10, 2009. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5759},
  pages        = {271--281},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-03770-2\_33},
  doi          = {10.1007/978-3-642-03770-2\_33},
  timestamp    = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pvm/VoVWGKT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/ZhuGGT09,
  author       = {Hao Zhu and
                  David Goodell and
                  William Gropp and
                  Rajeev Thakur},
  editor       = {Matti Ropo and
                  Jan Westerholm and
                  Jack J. Dongarra},
  title        = {Hierarchical Collectives in {MPICH2}},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  16th European {PVM/MPI} Users' Group Meeting, Espoo, Finland, September
                  7-10, 2009. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5759},
  pages        = {325--326},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-03770-2\_41},
  doi          = {10.1007/978-3-642-03770-2\_41},
  timestamp    = {Sat, 30 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pvm/ZhuGGT09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ppopp/BalajiFALKTM08,
  author       = {Pavan Balaji and
                  Wu{-}chun Feng and
                  Jeremy S. Archuleta and
                  Heshan Lin and
                  Rajkumar Kettimuthu and
                  Rajeev Thakur and
                  Xiaosong Ma},
  editor       = {Siddhartha Chatterjee and
                  Michael L. Scott},
  title        = {Semantics-based distributed {I/O} for {mpiBLAST}},
  booktitle    = {Proceedings of the 13th {ACM} {SIGPLAN} Symposium on Principles and
                  Practice of Parallel Programming, {PPOPP} 2008, Salt Lake City, UT,
                  USA, February 20-23, 2008},
  pages        = {293--294},
  publisher    = {{ACM}},
  year         = {2008},
  url          = {https://doi.org/10.1145/1345206.1345262},
  doi          = {10.1145/1345206.1345262},
  timestamp    = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl       = {https://dblp.org/rec/conf/ppopp/BalajiFALKTM08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/BalajiBGGT08,
  author    = {Balaji, Pavan and
               Buntinas, Darius and
               Goodell, David and
               Gropp, William and
               Thakur, Rajeev},
  editor    = {Lastovetsky, Alexey L. and
               Kechadi, M. Tahar and
               Dongarra, Jack J.},
  title     = {Toward Efficient Support for Multithreaded {MPI} Communication},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 15th European {PVM/MPI} Users' Group Meeting, Dublin,
               Ireland, September 7-10, 2008. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {5205},
  pages     = {120--129},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-540-87475-1\_20},
  doi       = {10.1007/978-3-540-87475-1\_20},
  timestamp = {Mon, 03 Jan 2022 22:32:15 +0100},
  biburl    = {https://dblp.org/rec/conf/pvm/BalajiBGGT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/BalajiCGTL08,
  author       = {Pavan Balaji and
                  Anthony Chan and
                  William Gropp and
                  Rajeev Thakur and
                  Ewing L. Lusk},
  editor       = {Alexey L. Lastovetsky and
                  M. Tahar Kechadi and
                  Jack J. Dongarra},
  title        = {Non-data-communication Overheads in {MPI:} Analysis on {Blue Gene/P}},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  15th European {PVM/MPI} Users' Group Meeting, Dublin, Ireland, September
                  7-10, 2008. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5205},
  pages        = {13--22},
  publisher    = {Springer},
  year         = {2008},
  url          = {https://doi.org/10.1007/978-3-540-87475-1\_9},
  doi          = {10.1007/978-3-540-87475-1\_9},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/BalajiCGTL08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/GroppKRTT08,
  author    = {Gropp, William D. and
               Kimpe, Dries and
               Ross, Robert B. and
               Thakur, Rajeev and
               Tr{\"{a}}ff, Jesper Larsson},
  editor    = {Lastovetsky, Alexey L. and
               Kechadi, M. Tahar and
               Dongarra, Jack J.},
  title     = {Self-consistent {MPI-IO} Performance Requirements and Expectations},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 15th European {PVM/MPI} Users' Group Meeting, Dublin,
               Ireland, September 7-10, 2008. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {5205},
  pages     = {167--176},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-540-87475-1\_25},
  doi       = {10.1007/978-3-540-87475-1\_25},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/GroppKRTT08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/SharmaVGKTG08,
  author    = {Sharma, Subodh and
               Vakkalanka, Sarvani S. and
               Gopalakrishnan, Ganesh and
               Kirby, Robert M. and
               Thakur, Rajeev and
               Gropp, William},
  editor    = {Lastovetsky, Alexey L. and
               Kechadi, M. Tahar and
               Dongarra, Jack J.},
  title     = {A Formal Approach to Detect Functionally Irrelevant Barriers in
               {MPI} Programs},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 15th European {PVM/MPI} Users' Group Meeting, Dublin,
               Ireland, September 7-10, 2008. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {5205},
  pages     = {265--273},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-540-87475-1\_36},
  doi       = {10.1007/978-3-540-87475-1\_36},
  timestamp = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/pvm/SharmaVGKTG08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/TraffRSBTG08,
  author    = {Tr{\"{a}}ff, Jesper Larsson and
               Ripke, Andreas and
               Siebert, Christian and
               Balaji, Pavan and
               Thakur, Rajeev and
               Gropp, William},
  editor    = {Lastovetsky, Alexey L. and
               Kechadi, M. Tahar and
               Dongarra, Jack J.},
  title     = {A Simple, Pipelined Algorithm for Large, Irregular All-gather Problems},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 15th European {PVM/MPI} Users' Group Meeting, Dublin,
               Ireland, September 7-10, 2008. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {5205},
  pages     = {84--93},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-540-87475-1\_16},
  doi       = {10.1007/978-3-540-87475-1\_16},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/TraffRSBTG08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/VakkalankaDGKTG08,
  author    = {Vakkalanka, Sarvani S. and
               Delisi, Michael and
               Gopalakrishnan, Ganesh and
               Kirby, Robert M. and
               Thakur, Rajeev and
               Gropp, William},
  editor    = {Lastovetsky, Alexey L. and
               Kechadi, M. Tahar and
               Dongarra, Jack J.},
  title     = {Implementing Efficient Dynamic Formal Verification Methods for
               {MPI} Programs},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 15th European {PVM/MPI} Users' Group Meeting, Dublin,
               Ireland, September 7-10, 2008. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {5205},
  pages     = {248--256},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-540-87475-1\_34},
  doi       = {10.1007/978-3-540-87475-1\_34},
  timestamp = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/pvm/VakkalankaDGKTG08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/BynaCSTG08,
  author    = {Byna, Surendra and
               Chen, Yong and
               Sun, Xian{-}He and
               Thakur, Rajeev and
               Gropp, William},
  title     = {Parallel {I/O} prefetching using {MPI} file caching and {I/O} signatures},
  booktitle = {Proceedings of the {ACM/IEEE} Conference on High Performance
               Computing, {SC} 2008, November 15-21, 2008, Austin, Texas, {USA}},
  pages     = {44},
  publisher = {{IEEE/ACM}},
  year      = {2008},
  url       = {https://doi.org/10.1109/SC.2008.5213604},
  doi       = {10.1109/SC.2008.5213604},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/BynaCSTG08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ijhpca/LathamRT07,
  author    = {Latham, Robert and
               Ross, Robert B. and
               Thakur, Rajeev},
  title     = {Implementing {MPI-IO} Atomic Mode and Shared File Pointers Using
               {MPI} One-Sided Communication},
  journal   = {Int. J. High Perform. Comput. Appl.},
  volume    = {21},
  number    = {2},
  pages     = {132--143},
  year      = {2007},
  url       = {https://doi.org/10.1177/1094342007077859},
  doi       = {10.1177/1094342007077859},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ijhpca/LathamRT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/pc/GroppT07,
  author    = {Gropp, William and
               Thakur, Rajeev},
  title     = {Thread-safety in an {MPI} implementation: Requirements and analysis},
  journal   = {Parallel Comput.},
  volume    = {33},
  number    = {9},
  pages     = {595--604},
  year      = {2007},
  url       = {https://doi.org/10.1016/j.parco.2007.07.002},
  doi       = {10.1016/J.PARCO.2007.07.002},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/pc/GroppT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/aPcsac/ThakurG07,
  author    = {Thakur, Rajeev and
               Gropp, William},
  editor    = {Choi, Lynn and
               Paek, Yunheung and
               Cho, Sangyeun},
  title     = {Open Issues in {MPI} Implementation},
  booktitle = {Advances in Computer Systems Architecture, 12th Asia-Pacific
               Conference, {ACSAC} 2007, Seoul, Korea, August 23-25, 2007,
               Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4697},
  pages     = {327--338},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-74309-5\_31},
  doi       = {10.1007/978-3-540-74309-5\_31},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/aPcsac/ThakurG07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ipps/BalajiBBSTG07,
  author       = {Pavan Balaji and
                  Darius Buntinas and
                  Satish Balay and
                  Barry F. Smith and
                  Rajeev Thakur and
                  William Gropp},
  title        = {Nonuniformly Communicating Noncontiguous Data: {A} Case Study with
                  {PETSc} and {MPI}},
  booktitle    = {21st International Parallel and Distributed Processing Symposium {(IPDPS}
                  2007), Proceedings, 26-30 March 2007, Long Beach, California, {USA}},
  pages        = {1--10},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/IPDPS.2007.370223},
  doi          = {10.1109/IPDPS.2007.370223},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/BalajiBBSTG07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/GroppT07,
  author    = {Gropp, William D. and
               Thakur, Rajeev},
  editor    = {Cappello, Franck and
               H{\'{e}}rault, Thomas and
               Dongarra, Jack J.},
  title     = {Revealing the Performance of {MPI} {RMA} Implementations},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 14th European {PVM/MPI} User's Group Meeting, Paris,
               France, September 30 - October 3, 2007, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4757},
  pages     = {272--280},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-75416-9\_38},
  doi       = {10.1007/978-3-540-75416-9\_38},
  timestamp = {Tue, 07 May 2024 20:11:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/GroppT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/LathamGRT07,
  author    = {Latham, Robert and
               Gropp, William and
               Ross, Robert B. and
               Thakur, Rajeev},
  editor    = {Cappello, Franck and
               H{\'{e}}rault, Thomas and
               Dongarra, Jack J.},
  title     = {Extending the {MPI-2} Generalized Request Interface},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 14th European {PVM/MPI} User's Group Meeting, Paris,
               France, September 30 - October 3, 2007, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4757},
  pages     = {223--232},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-75416-9\_33},
  doi       = {10.1007/978-3-540-75416-9\_33},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/LathamGRT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/PervezGKPTG07,
  author    = {Pervez, Salman and
               Gopalakrishnan, Ganesh and
               Kirby, Robert M. and
               Palmer, Robert and
               Thakur, Rajeev and
               Gropp, William},
  editor    = {Cappello, Franck and
               H{\'{e}}rault, Thomas and
               Dongarra, Jack J.},
  title     = {Practical Model-Checking Method for Verifying Correctness of
               {MPI} Programs},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 14th European {PVM/MPI} User's Group Meeting, Paris,
               France, September 30 - October 3, 2007, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4757},
  pages     = {344--353},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-75416-9\_46},
  doi       = {10.1007/978-3-540-75416-9\_46},
  timestamp = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/pvm/PervezGKPTG07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/ThakurG07,
  author       = {Rajeev Thakur and
                  William Gropp},
  editor       = {Franck Cappello and
                  Thomas H{\'{e}}rault and
                  Jack J. Dongarra},
  title        = {Test Suite for Evaluating Performance of {MPI} Implementations That
                  Support {MPI\_THREAD\_MULTIPLE}},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  14th European {PVM/MPI} User's Group Meeting, Paris, France, September
                  30 - October 3, 2007, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {4757},
  pages        = {46--55},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-3-540-75416-9\_13},
  doi          = {10.1007/978-3-540-75416-9\_13},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/ThakurG07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/TraffGT07,
  author    = {Tr{\"{a}}ff, Jesper Larsson and
               Gropp, William and
               Thakur, Rajeev},
  editor    = {Cappello, Franck and
               H{\'{e}}rault, Thomas and
               Dongarra, Jack J.},
  title     = {Self-consistent {MPI} Performance Requirements},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 14th European {PVM/MPI} User's Group Meeting, Paris,
               France, September 30 - October 3, 2007, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4757},
  pages     = {36--45},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-75416-9\_12},
  doi       = {10.1007/978-3-540-75416-9\_12},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/pvm/TraffGT07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cluster/ColomaCCLRTW06,
  author    = {Coloma, Kenin and
               Ching, Avery and
               Choudhary, Alok N. and
               Liao, Wei{-}keng and
               Ross, Robert B. and
               Thakur, Rajeev and
               Ward, Lee},
  title     = {A New Flexible {MPI} Collective {I/O} Implementation},
  booktitle = {Proceedings of the 2006 {IEEE} International Conference on
               Cluster Computing, September 25-28, 2006, Barcelona, Spain},
  publisher = {{IEEE} Computer Society},
  year      = {2006},
  url       = {https://doi.org/10.1109/CLUSTR.2006.311865},
  doi       = {10.1109/CLUSTR.2006.311865},
  timestamp = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/cluster/ColomaCCLRTW06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ipps/LeeRABT06,
  author    = {Lee, Jonghyun and
               Ross, Robert B. and
               Atchley, Scott and
               Beck, Micah and
               Thakur, Rajeev},
  title     = {{MPI-IO/L:} efficient remote {I/O} for {MPI-IO} via logistical networking},
  booktitle = {20th International Parallel and Distributed Processing Symposium
               {(IPDPS} 2006), Proceedings, 25-29 April 2006, Rhodes Island,
               Greece},
  publisher = {{IEEE}},
  year      = {2006},
  url       = {https://doi.org/10.1109/IPDPS.2006.1639305},
  doi       = {10.1109/IPDPS.2006.1639305},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/LeeRABT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/BynaSTG06,
  author    = {Byna, Surendra and
               Sun, Xian{-}He and
               Thakur, Rajeev and
               Gropp, William},
  editor    = {Mohr, Bernd and
               Tr{\"{a}}ff, Jesper Larsson and
               Worringen, Joachim and
               Dongarra, Jack J.},
  title     = {Automatic Memory Optimizations for Improving {MPI} Derived
               Datatype Performance},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 13th European {PVM/MPI} User's Group Meeting, Bonn,
               Germany, September 17-20, 2006, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4192},
  pages     = {238--246},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/11846802\_36},
  doi       = {10.1007/11846802\_36},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/pvm/BynaSTG06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/GroppT06,
  author    = {Gropp, William D. and
               Thakur, Rajeev},
  editor    = {Mohr, Bernd and
               Tr{\"{a}}ff, Jesper Larsson and
               Worringen, Joachim and
               Dongarra, Jack J.},
  title     = {Issues in Developing a Thread-Safe {MPI} Implementation},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 13th European {PVM/MPI} User's Group Meeting, Bonn,
               Germany, September 17-20, 2006, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4192},
  pages     = {12--21},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/11846802\_11},
  doi       = {10.1007/11846802\_11},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/pvm/GroppT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/LathamRT06,
  author    = {Latham, Robert and
               Ross, Robert B. and
               Thakur, Rajeev},
  editor    = {Mohr, Bernd and
               Tr{\"{a}}ff, Jesper Larsson and
               Worringen, Joachim and
               Dongarra, Jack J.},
  title     = {Can {MPI} Be Used for Persistent Parallel Services?},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 13th European {PVM/MPI} User's Group Meeting, Bonn,
               Germany, September 17-20, 2006, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4192},
  pages     = {275--284},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/11846802\_40},
  doi       = {10.1007/11846802\_40},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/LathamRT06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/PervezGKTG06,
  author    = {Pervez, Salman and
               Gopalakrishnan, Ganesh and
               Kirby, Robert M. and
               Thakur, Rajeev and
               Gropp, William D.},
  editor    = {Mohr, Bernd and
               Tr{\"{a}}ff, Jesper Larsson and
               Worringen, Joachim and
               Dongarra, Jack J.},
  title     = {Formal Verification of Programs That Use {MPI} One-Sided Communication},
  booktitle = {Recent Advances in Parallel Virtual Machine and Message Passing
               Interface, 13th European {PVM/MPI} User's Group Meeting, Bonn,
               Germany, September 17-20, 2006, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4192},
  pages     = {30--39},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/11846802\_13},
  doi       = {10.1007/11846802\_13},
  timestamp = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/pvm/PervezGKTG06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/GroppLTR06,
  author    = {Gropp, William and
               Lusk, Ewing L. and
               Thakur, Rajeev and
               Ross, Robert B.},
  title     = {{S01} - Advanced {MPI:} {I/O} and one-sided communication},
  booktitle = {Proceedings of the {ACM/IEEE} {SC2006} Conference on High
               Performance Networking and Computing, November 11-17, 2006,
               Tampa, FL, {USA}},
  pages     = {202},
  publisher = {{ACM} Press},
  year      = {2006},
  url       = {https://doi.org/10.1145/1188455.1188666},
  doi       = {10.1145/1188455.1188666},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sc/GroppLTR06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ijhpca/ThakurRG05,
  author    = {Thakur, Rajeev and
               Rabenseifner, Rolf and
               Gropp, William},
  title     = {Optimization of Collective Communication Operations in {MPICH}},
  journal   = {Int. J. High Perform. Comput. Appl.},
  volume    = {19},
  number    = {1},
  pages     = {49--66},
  year      = {2005},
  url       = {https://doi.org/10.1177/1094342005051521},
  doi       = {10.1177/1094342005051521},
  timestamp = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ijhpca/ThakurRG05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ccgrid/RossLGTT05,
  author    = {Ross, Robert B. and
               Latham, Robert and
               Gropp, William and
               Thakur, Rajeev and
               Toonen, Brian R.},
  title     = {Implementing {MPI-IO} atomic mode without file system support},
  booktitle = {5th International Symposium on Cluster Computing and the Grid
               (CCGrid 2005), 9-12 May, 2005, Cardiff, {UK}},
  pages     = {1135--1142},
  publisher = {{IEEE} Computer Society},
  year      = {2005},
  url       = {https://doi.org/10.1109/CCGRID.2005.1558687},
  doi       = {10.1109/CCGRID.2005.1558687},
  timestamp = {Sat, 31 May 2025 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ccgrid/RossLGTT05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/GroppT05,
  author       = {William D. Gropp and
                  Rajeev Thakur},
  editor       = {Di Martino, Beniamino and
                  Dieter Kranzlm{\"{u}}ller and
                  Jack J. Dongarra},
  title        = {An Evaluation of Implementation Options for {MPI} One-Sided Communication},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  12th European {PVM/MPI} Users' Group Meeting, Sorrento, Italy, September
                  18-21, 2005, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3666},
  pages        = {415--424},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11557265\_53},
  doi          = {10.1007/11557265\_53},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/GroppT05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/LathamRTT05,
  author       = {Robert Latham and
                  Robert B. Ross and
                  Rajeev Thakur and
                  Brian R. Toonen},
  editor       = {Di Martino, Beniamino and
                  Dieter Kranzlm{\"{u}}ller and
                  Jack J. Dongarra},
  title        = {Implementing {MPI-IO} Shared File Pointers Without File System Support},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  12th European {PVM/MPI} Users' Group Meeting, Sorrento, Italy, September
                  18-21, 2005, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3666},
  pages        = {84--93},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11557265\_15},
  doi          = {10.1007/11557265\_15},
  timestamp    = {Sat, 31 May 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/LathamRTT05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/ThakurRL05,
  author       = {Rajeev Thakur and
                  Robert B. Ross and
                  Robert Latham},
  editor       = {Di Martino, Beniamino and
                  Dieter Kranzlm{\"{u}}ller and
                  Jack J. Dongarra},
  title        = {Implementing Byte-Range Locks Using {MPI} One-Sided Communication},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  12th European {PVM/MPI} Users' Group Meeting, Sorrento, Italy, September
                  18-21, 2005, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3666},
  pages        = {119--128},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11557265\_19},
  doi          = {10.1007/11557265\_19},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/ThakurRL05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ccgrid/JiangLJPGT04,
  author       = {Weihang Jiang and
                  Jiuxing Liu and
                  Hyun{-}Wook Jin and
                  Dhabaleswar K. Panda and
                  William Gropp and
                  Rajeev Thakur},
  title        = {High performance {MPI-2} one-sided communication over {InfiniBand}},
  booktitle    = {4th {IEEE/ACM} International Symposium on Cluster Computing and the
                  Grid (CCGrid 2004), April 19-22, 2004, Chicago, Illinois, {USA}},
  pages        = {531--538},
  publisher    = {{IEEE} Computer Society},
  year         = {2004},
  url          = {https://doi.org/10.1109/CCGrid.2004.1336648},
  doi          = {10.1109/CCGRID.2004.1336648},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ccgrid/JiangLJPGT04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cluster/LeeRTMW04,
  author    = {Lee, Jonghyun and
               Ross, Robert B. and
               Thakur, Rajeev and
               Ma, Xiaosong and
               Winslett, Marianne},
  title     = {{RFS:} efficient and flexible remote file access for {MPI-IO}},
  booktitle = {2004 {IEEE} International Conference on Cluster Computing
               {(CLUSTER} 2004), September 20-23 2004, San Diego, California,
               {USA}},
  pages     = {71--81},
  publisher = {{IEEE} Computer Society},
  year      = {2004},
  url       = {https://doi.org/10.1109/CLUSTR.2004.1392604},
  doi       = {10.1109/CLUSTR.2004.1392604},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cluster/LeeRTMW04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/JiangLJPBTG04,
  author       = {Weihang Jiang and
                  Jiuxing Liu and
                  Hyun{-}Wook Jin and
                  Dhabaleswar K. Panda and
                  Darius Buntinas and
                  Rajeev Thakur and
                  William D. Gropp},
  editor       = {Dieter Kranzlm{\"{u}}ller and
                  P{\'{e}}ter Kacsuk and
                  Jack J. Dongarra},
  title        = {Efficient Implementation of {MPI-2} Passive One-Sided Communication
                  on {InfiniBand} Clusters},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  11th European {PVM/MPI} Users' Group Meeting, Budapest, Hungary, September
                  19-22, 2004, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3241},
  pages        = {68--76},
  publisher    = {Springer},
  year         = {2004},
  url          = {https://doi.org/10.1007/978-3-540-30218-6\_16},
  doi          = {10.1007/978-3-540-30218-6\_16},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pvm/JiangLJPBTG04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/LathamRT04,
  author       = {Robert Latham and
                  Robert B. Ross and
                  Rajeev Thakur},
  editor       = {Dieter Kranzlm{\"{u}}ller and
                  P{\'{e}}ter Kacsuk and
                  Jack J. Dongarra},
  title        = {The Impact of File Systems on {MPI-IO} Scalability},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  11th European {PVM/MPI} Users' Group Meeting, Budapest, Hungary, September
                  19-22, 2004, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3241},
  pages        = {87--96},
  publisher    = {Springer},
  year         = {2004},
  url          = {https://doi.org/10.1007/978-3-540-30218-6\_18},
  doi          = {10.1007/978-3-540-30218-6\_18},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/LathamRT04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/ThakurGT04,
  author       = {Rajeev Thakur and
                  William D. Gropp and
                  Brian R. Toonen},
  editor       = {Dieter Kranzlm{\"{u}}ller and
                  P{\'{e}}ter Kacsuk and
                  Jack J. Dongarra},
  title        = {Minimizing Synchronization Overhead in the Implementation of {MPI}
                  One-Sided Communication},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  11th European {PVM/MPI} Users' Group Meeting, Budapest, Hungary, September
                  19-22, 2004, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3241},
  pages        = {57--67},
  publisher    = {Springer},
  year         = {2004},
  url          = {https://doi.org/10.1007/978-3-540-30218-6\_15},
  doi          = {10.1007/978-3-540-30218-6\_15},
  timestamp    = {Sat, 31 May 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pvm/ThakurGT04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cluster/BynaGST03,
  author       = {Surendra Byna and
                  William D. Gropp and
                  Xian{-}He Sun and
                  Rajeev Thakur},
  title        = {Improving the Performance of {MPI} Derived Datatypes by Optimizing
                  Memory-Access Cost},
  booktitle    = {2003 {IEEE} International Conference on Cluster Computing {(CLUSTER}
                  2003), 1-4 December 2003, Kowloon, Hong Kong, China},
  pages        = {412--419},
  publisher    = {{IEEE} Computer Society},
  year         = {2003},
  url          = {https://doi.org/10.1109/CLUSTR.2003.1253341},
  doi          = {10.1109/CLUSTR.2003.1253341},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cluster/BynaGST03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cluster/GroppLRT03,
  author       = {William D. Gropp and
                  Ewing L. Lusk and
                  Robert B. Ross and
                  Rajeev Thakur},
  title        = {Using {MPI-2:} Advanced Features of the Message Passing Interface},
  booktitle    = {2003 {IEEE} International Conference on Cluster Computing {(CLUSTER}
                  2003), 1-4 December 2003, Kowloon, Hong Kong, China},
  publisher    = {{IEEE} Computer Society},
  year         = {2003},
  url          = {https://doi.ieeecomputersociety.org/10.1109/CLUSTER.2003.10010},
  doi          = {10.1109/CLUSTER.2003.10010},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cluster/GroppLRT03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/pvm/ThakurG03,
  author       = {Rajeev Thakur and
                  William Gropp},
  editor       = {Jack J. Dongarra and
                  Domenico Laforenza and
                  Salvatore Orlando},
  title        = {Improving the Performance of Collective Operations in {MPICH}},
  booktitle    = {Recent Advances in Parallel Virtual Machine and Message Passing Interface,
                  10th European {PVM/MPI} Users' Group Meeting, Venice, Italy, September
                  29 - October 2, 2003, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {2840},
  pages        = {257--267},
  publisher    = {Springer},
  year         = {2003},
  url          = {https://doi.org/10.1007/978-3-540-39924-7\_38},
  doi          = {10.1007/978-3-540-39924-7\_38},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pvm/ThakurG03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/pc/ThakurGL02,
  author       = {Rajeev Thakur and
                  William Gropp and
                  Ewing L. Lusk},
  title        = {Optimizing noncontiguous accesses in {MPI-IO}},
  journal      = {Parallel Comput.},
  volume       = {28},
  number       = {1},
  pages        = {83--105},
  year         = {2002},
  url          = {https://doi.org/10.1016/S0167-8191(01)00129-6},
  doi          = {10.1016/S0167-8191(01)00129-6},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pc/ThakurGL02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/iopads/ThakurGL99,
  author       = {Rajeev Thakur and
                  William Gropp and
                  Ewing L. Lusk},
  title        = {On Implementing {MPI-IO} Portably and with High Performance},
  booktitle    = {Proceedings of the Sixth Workshop on {I/O} in Parallel and Distributed
                  Systems, {IOPADS} 1999, May 5, 1999, Atlanta, GA, {USA}},
  pages        = {23--32},
  publisher    = {{ACM}},
  year         = {1999},
  url          = {https://doi.org/10.1145/301816.301826},
  doi          = {10.1145/301816.301826},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iopads/ThakurGL99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/ThakurGL98,
  author       = {Rajeev Thakur and
                  William Gropp and
                  Ewing L. Lusk},
  title        = {A Case for Using {MPI}'s Derived Datatypes to Improve {I/O} Performance},
  booktitle    = {Proceedings of the {ACM/IEEE} Conference on Supercomputing, {SC} 1998,
                  November 7-13, 1998, Orlando, FL, {USA}},
  pages        = {1},
  publisher    = {{IEEE} Computer Society},
  year         = {1998},
  url          = {https://doi.org/10.1109/SC.1998.10006},
  doi          = {10.1109/SC.1998.10006},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/ThakurGL98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tpds/WangGBS23,
  author       = {Chen Wang and
                  Yanfei Guo and
                  Pavan Balaji and
                  Marc Snir},
  title        = {Near-Lossless {MPI} Tracing and Proxy Application Autogeneration},
  journal      = {{IEEE} Trans. Parallel Distributed Syst.},
  volume       = {34},
  number       = {1},
  pages        = {123--140},
  year         = {2023},
  url          = {https://doi.org/10.1109/TPDS.2022.3215942},
  doi          = {10.1109/TPDS.2022.3215942},
  timestamp    = {Mon, 05 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tpds/WangGBS23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tpds/ZambreSZBCB21,
  author       = {Rohit Zambre and
                  Damodar Sahasrabudhe and
                  Hui Zhou and
                  Martin Berzins and
                  Aparna Chandramowlishwaran and
                  Pavan Balaji},
  title        = {Logically Parallel Communication for Fast {MPI+Threads} Applications},
  journal      = {{IEEE} Trans. Parallel Distributed Syst.},
  volume       = {32},
  number       = {12},
  pages        = {3038--3052},
  year         = {2021},
  url          = {https://doi.org/10.1109/TPDS.2021.3075157},
  doi          = {10.1109/TPDS.2021.3075157},
  timestamp    = {Wed, 16 Apr 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tpds/ZambreSZBCB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ccgrid/GhoshGBG21,
  author       = {Sayan Ghosh and
                  Yanfei Guo and
                  Pavan Balaji and
                  Assefaw H. Gebremedhin},
  editor       = {Laurent Lef{\`{e}}vre and
                  Stacy Patterson and
                  Young Choon Lee and
                  Haiying Shen and
                  Shashikant Ilager and
                  Mohammad Goudarzi and
                  Adel Nadjaran Toosi and
                  Rajkumar Buyya},
  title        = {{RMACXX:} An Efficient High-Level {C++} Interface over {MPI-3} {RMA}},
  booktitle    = {21st {IEEE/ACM} International Symposium on Cluster, Cloud and Internet
                  Computing, CCGrid 2021, Melbourne, Australia, May 10-13, 2021},
  pages        = {143--155},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/CCGrid51090.2021.00024},
  doi          = {10.1109/CCGRID51090.2021.00024},
  timestamp    = {Fri, 06 Aug 2021 11:08:53 +0200},
  biburl       = {https://dblp.org/rec/conf/ccgrid/GhoshGBG21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cluster/OuyangSHCB21,
  author       = {Kaiming Ouyang and
                  Min Si and
                  Atsushi Hori and
                  Zizhong Chen and
                  Pavan Balaji},
  title        = {Daps: {A} Dynamic Asynchronous Progress Stealing Model for {MPI} Communication},
  booktitle    = {{IEEE} International Conference on Cluster Computing, {CLUSTER} 2021,
                  Portland, OR, USA, September 7-10, 2021},
  pages        = {516--527},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/Cluster48925.2021.00027},
  doi          = {10.1109/CLUSTER48925.2021.00027},
  timestamp    = {Wed, 01 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cluster/OuyangSHCB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/openshmem/SiFHB21,
  author       = {Min Si and
                  Huansong Fu and
                  Jeff R. Hammond and
                  Pavan Balaji},
  editor       = {Stephen W. Poole and
                  Oscar R. Hernandez and
                  Matthew B. Baker and
                  Tony Curtis},
  title        = {{OpenSHMEM} over {MPI} as a Performance Contender: Thorough Analysis
                  and Optimizations},
  booktitle    = {OpenSHMEM and Related Technologies. OpenSHMEM in the Era of Exascale
                  and Smart Networks - 8th Workshop on OpenSHMEM and Related Technologies,
                  OpenSHMEM 2021, Virtual Event, September 14-16, 2021, Revised Selected
                  Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {13159},
  pages        = {39--60},
  publisher    = {Springer},
  year         = {2021},
  url          = {https://doi.org/10.1007/978-3-031-04888-3\_3},
  doi          = {10.1007/978-3-031-04888-3\_3},
  timestamp    = {Fri, 10 Mar 2023 09:48:58 +0100},
  biburl       = {https://dblp.org/rec/conf/openshmem/SiFHB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/0004BS21,
  author       = {Chen Wang and
                  Pavan Balaji and
                  Marc Snir},
  editor       = {Bronis R. de Supinski and
                  Mary W. Hall and
                  Todd Gamblin},
  title        = {Pilgrim: scalable and (near) lossless {MPI} tracing},
  booktitle    = {International Conference for High Performance Computing, Networking,
                  Storage and Analysis, {SC} 2021, St. Louis, Missouri, USA, November
                  14-19, 2021},
  pages        = {52},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://doi.org/10.1145/3458817.3476151},
  doi          = {10.1145/3458817.3476151},
  timestamp    = {Tue, 08 Nov 2022 16:03:02 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/0004BS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tpds/GaoGZCLBT20,
  author       = {Tao Gao and
                  Yanfei Guo and
                  Boyu Zhang and
                  Pietro Cicotti and
                  Yutong Lu and
                  Pavan Balaji and
                  Michela Taufer},
  title        = {Memory-Efficient and Skew-Tolerant {MapReduce} Over {MPI} for Supercomputing
                  Systems},
  journal      = {{IEEE} Trans. Parallel Distributed Syst.},
  volume       = {31},
  number       = {12},
  pages        = {2734--2748},
  year         = {2020},
  url          = {https://doi.org/10.1109/TPDS.2019.2932066},
  doi          = {10.1109/TPDS.2019.2932066},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tpds/GaoGZCLBT20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ics/ZambreCB20,
  author       = {Rohit Zambre and
                  Aparna Chandramowlishwaran and
                  Pavan Balaji},
  editor       = {Eduard Ayguad{\'{e}} and
                  Wen{-}mei W. Hwu and
                  Rosa M. Badia and
                  H. Peter Hofstee},
  title        = {How {I} learned to stop worrying about user-visible endpoints and
                  love {MPI}},
  booktitle    = {{ICS} '20: 2020 International Conference on Supercomputing, Barcelona
                  Spain, June, 2020},
  pages        = {35:1--35:13},
  publisher    = {{ACM}},
  year         = {2020},
  url          = {https://doi.org/10.1145/3392717.3392773},
  doi          = {10.1145/3392717.3392773},
  timestamp    = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ics/ZambreCB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/EvansCOPIRB20,
  author       = {Noah Evans and
                  Jan Ciesko and
                  Stephen L. Olivier and
                  Howard Pritchard and
                  Shintaro Iwasaki and
                  Ken Raffenetti and
                  Pavan Balaji},
  title        = {Implementing Flexible Threading Support in {Open MPI}},
  booktitle    = {Workshop on Exascale MPI, ExaMPI@SC 2020, Atlanta, GA, USA, November
                  13, 2020},
  pages        = {21--30},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ExaMPI52011.2020.00008},
  doi          = {10.1109/EXAMPI52011.2020.00008},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sc/EvansCOPIRB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/OuyangSHCB20,
  author       = {Kaiming Ouyang and
                  Min Si and
                  Atsushi Hori and
                  Zizhong Chen and
                  Pavan Balaji},
  editor       = {Christine Cuicchi and
                  Irene Qualters and
                  William T. Kramer},
  title        = {{CAB-MPI:} exploring interprocess work-stealing towards balanced {MPI}
                  communication},
  booktitle    = {Proceedings of the International Conference for High Performance Computing,
                  Networking, Storage and Analysis, {SC} 2020, Virtual Event / Atlanta,
                  Georgia, USA, November 9-19, 2020},
  pages        = {36},
  publisher    = {{IEEE/ACM}},
  year         = {2020},
  url          = {https://doi.org/10.1109/SC41405.2020.00040},
  doi          = {10.1109/SC41405.2020.00040},
  timestamp    = {Wed, 04 May 2022 13:02:27 +0200},
  biburl       = {https://dblp.org/rec/conf/sc/OuyangSHCB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-2002-02509,
  author       = {Rohit Zambre and
                  Aparna Chandramowlishwaran and
                  Pavan Balaji},
  title        = {Scalable Communication Endpoints for {MPI+Threads} Applications},
  journal      = {CoRR},
  volume       = {abs/2002.02509},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.02509},
  eprinttype   = {arXiv},
  eprint       = {2002.02509},
  timestamp    = {Mon, 10 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-02509.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-2005-00263,
  author       = {Rohit Zambre and
                  Aparna Chandramowlishwaran and
                  Pavan Balaji},
  title        = {How {I} Learned to Stop Worrying About User-Visible Endpoints and
                  Love {MPI}},
  journal      = {CoRR},
  volume       = {abs/2005.00263},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.00263},
  eprinttype   = {arXiv},
  eprint       = {2005.00263},
  timestamp    = {Fri, 08 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-00263.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/parco/DavisGCJDDBT19,
  author       = {Joshua Hoke Davis and
                  Tao Gao and
                  Sunita Chandrasekaran and
                  Heike Jagode and
                  Anthony Danalis and
                  Jack J. Dongarra and
                  Pavan Balaji and
                  Michela Taufer},
  editor       = {Ian T. Foster and
                  Gerhard R. Joubert and
                  Ludek Kucera and
                  Wolfgang E. Nagel and
                  Frans J. Peters},
  title        = {Characterization of Power Usage and Performance in Data-Intensive
                  Applications Using {MapReduce} over {MPI}},
  booktitle    = {Parallel Computing: Technology Trends, Proceedings of the International
                  Conference on Parallel Computing, {PARCO} 2019, Prague, Czech Republic,
                  September 10-13, 2019},
  series       = {Advances in Parallel Computing},
  volume       = {36},
  pages        = {287--298},
  publisher    = {{IOS} Press},
  year         = {2019},
  url          = {https://doi.org/10.3233/APC200053},
  doi          = {10.3233/APC200053},
  timestamp    = {Mon, 01 Feb 2021 08:42:04 +0100},
  biburl       = {https://dblp.org/rec/conf/parco/DavisGCJDDBT19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/topc/AmerLBCWHM18,
  author       = {Abdelhalim Amer and
                  Huiwei Lu and
                  Pavan Balaji and
                  Milind Chabbi and
                  Yanjie Wei and
                  Jeff R. Hammond and
                  Satoshi Matsuoka},
  title        = {Lock Contention Management in Multithreaded {MPI}},
  journal      = {{ACM} Trans. Parallel Comput.},
  volume       = {5},
  number       = {3},
  pages        = {12:1--12:21},
  year         = {2018},
  url          = {https://doi.org/10.1145/3275443},
  doi          = {10.1145/3275443},
  timestamp    = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/topc/AmerLBCWHM18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tpds/SiPHBTI18,
  author       = {Min Si and
                  Antonio J. Pe{\~{n}}a and
                  Jeff R. Hammond and
                  Pavan Balaji and
                  Masamichi Takagi and
                  Yutaka Ishikawa},
  title        = {Dynamic Adaptable Asynchronous Progress Model for {MPI} {RMA} Multiphase
                  Applications},
  journal      = {{IEEE} Trans. Parallel Distributed Syst.},
  volume       = {29},
  number       = {9},
  pages        = {1975--1989},
  year         = {2018},
  url          = {https://doi.org/10.1109/TPDS.2018.2815568},
  doi          = {10.1109/TPDS.2018.2815568},
  timestamp    = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tpds/SiPHBTI18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icpads/GaoGZCLBT18,
  author       = {Tao Gao and
                  Yanfei Guo and
                  Boyu Zhang and
                  Pietro Cicotti and
                  Yutong Lu and
                  Pavan Balaji and
                  Michela Taufer},
  title        = {On the Power of Combiner Optimizations in {MapReduce} Over {MPI} Workflows},
  booktitle    = {24th {IEEE} International Conference on Parallel and Distributed Systems,
                  {ICPADS} 2018, Singapore, December 11-13, 2018},
  pages        = {441--448},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/PADSW.2018.8644595},
  doi          = {10.1109/PADSW.2018.8644595},
  timestamp    = {Sat, 05 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icpads/GaoGZCLBT18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icpads/ZambreCB18,
  author       = {Rohit Zambre and
                  Aparna Chandramowlishwaran and
                  Pavan Balaji},
  title        = {Scalable Communication Endpoints for {MPI+Threads} Applications},
  booktitle    = {24th {IEEE} International Conference on Parallel and Distributed Systems,
                  {ICPADS} 2018, Singapore, December 11-13, 2018},
  pages        = {803--812},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/PADSW.2018.8645059},
  doi          = {10.1109/PADSW.2018.8645059},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icpads/ZambreCB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/ChunduriPBHK18,
  author       = {Sudheer Chunduri and
                  Scott Parker and
                  Pavan Balaji and
                  Kevin Harms and
                  Kalyan Kumaran},
  title        = {Characterization of {MPI} usage on a production supercomputer},
  booktitle    = {Proceedings of the International Conference for High Performance Computing,
                  Networking, Storage, and Analysis, {SC} 2018, Dallas, TX, USA, November
                  11-16, 2018},
  pages        = {30:1--30:15},
  publisher    = {{IEEE} / {ACM}},
  year         = {2018},
  url          = {http://dl.acm.org/citation.cfm?id=3291696},
  timestamp    = {Mon, 12 Nov 2018 09:05:15 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/ChunduriPBHK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ccgrid/DangSAB17,
  author       = {Hoang{-}Vu Dang and
                  Sangmin Seo and
                  Abdelhalim Amer and
                  Pavan Balaji},
  title        = {Advanced Thread Synchronization for Multithreaded {MPI} Implementations},
  booktitle    = {Proceedings of the 17th {IEEE/ACM} International Symposium on Cluster,
                  Cloud and Grid Computing, {CCGRID} 2017, Madrid, Spain, May 14-17,
                  2017},
  pages        = {314--324},
  publisher    = {{IEEE} Computer Society / {ACM}},
  year         = {2017},
  url          = {https://doi.org/10.1109/CCGRID.2017.65},
  doi          = {10.1109/CCGRID.2017.65},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ccgrid/DangSAB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/hipc/MirsadeghiTBA17,
  author       = {Seyed Hessam Mirsadeghi and
                  Jesper Larsson Tr{\"{a}}ff and
                  Pavan Balaji and
                  Ahmad Afsahi},
  title        = {Exploiting Common Neighborhoods to Optimize {MPI} Neighborhood Collectives},
  booktitle    = {24th {IEEE} International Conference on High Performance Computing,
                  HiPC 2017, Jaipur, India, December 18-21, 2017},
  pages        = {348--357},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/HiPC.2017.00047},
  doi          = {10.1109/HIPC.2017.00047},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/hipc/MirsadeghiTBA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/hpcc/SiB17,
  author       = {Min Si and
                  Pavan Balaji},
  title        = {Process-Based Asynchronous Progress Model for {MPI} Point-to-Point
                  Communication},
  booktitle    = {19th {IEEE} International Conference on High Performance Computing
                  and Communications; 15th {IEEE} International Conference on Smart
                  City; 3rd {IEEE} International Conference on Data Science and Systems,
                  HPCC/SmartCity/DSS 2017, Bangkok, Thailand, December 18-20, 2017},
  pages        = {206--214},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/HPCC-SmartCity-DSS.2017.27},
  doi          = {10.1109/HPCC-SMARTCITY-DSS.2017.27},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/hpcc/SiB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icpads/LathamBB17,
  author       = {Robert Latham and
                  Leonardo Bautista{-}Gomez and
                  Pavan Balaji},
  title        = {Portable Topology-Aware {MPI-I/O}},
  booktitle    = {23rd {IEEE} International Conference on Parallel and Distributed Systems,
                  {ICPADS} 2017, Shenzhen, China, December 15-17, 2017},
  pages        = {710--719},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICPADS.2017.00096},
  doi          = {10.1109/ICPADS.2017.00096},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icpads/LathamBB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cluster/GuoYMZB16,
  author       = {Jichi Guo and
                  Qing Yi and
                  Jiayuan Meng and
                  Junchao Zhang and
                  Pavan Balaji},
  title        = {Compiler-Assisted Overlapping of Communication and Computation in
                  {MPI} Applications},
  booktitle    = {2016 {IEEE} International Conference on Cluster Computing, {CLUSTER}
                  2016, Taipei, Taiwan, September 12-16, 2016},
  pages        = {60--69},
  publisher    = {{IEEE} Computer Society},
  year         = {2016},
  url          = {https://doi.org/10.1109/CLUSTER.2016.62},
  doi          = {10.1109/CLUSTER.2016.62},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cluster/GuoYMZB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icpp/GhoshHPBGC16,
  author       = {Sayan Ghosh and
                  Jeff R. Hammond and
                  Antonio J. Pe{\~{n}}a and
                  Pavan Balaji and
                  Assefaw Hadish Gebremedhin and
                  Barbara M. Chapman},
  title        = {One-Sided Interface for Matrix Operations Using {MPI-3} {RMA:} {A}
                  Case Study with {Elemental}},
  booktitle    = {45th International Conference on Parallel Processing, {ICPP} 2016,
                  Philadelphia, PA, USA, August 16-19, 2016},
  pages        = {185--194},
  publisher    = {{IEEE} Computer Society},
  year         = {2016},
  url          = {https://doi.org/10.1109/ICPP.2016.28},
  doi          = {10.1109/ICPP.2016.28},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icpp/GhoshHPBGC16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ispdc/ZhaoBG16,
  author       = {Xin Zhao and
                  Pavan Balaji and
                  William Gropp},
  editor       = {Riqing Chen and
                  Chunming Rong and
                  Dan Grigoras},
  title        = {Scalability Challenges in Current {MPI} One-Sided Implementations},
  booktitle    = {15th International Symposium on Parallel and Distributed Computing,
                  {ISPDC} 2016, Fuzhou, China, July 8-10, 2016},
  pages        = {38--47},
  publisher    = {{IEEE} Computer Society},
  year         = {2016},
  url          = {https://doi.org/10.1109/ISPDC.2016.14},
  doi          = {10.1109/ISPDC.2016.14},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ispdc/ZhaoBG16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ccgrid/AmerLBM15,
  author       = {Abdelhalim Amer and
                  Huiwei Lu and
                  Pavan Balaji and
                  Satoshi Matsuoka},
  title        = {Characterizing {MPI} and Hybrid {MPI+Threads} Applications at Scale:
                  Case Study with {BFS}},
  booktitle    = {15th {IEEE/ACM} International Symposium on Cluster, Cloud and Grid
                  Computing, CCGrid 2015, Shenzhen, China, May 4-7, 2015},
  pages        = {1075--1083},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/CCGrid.2015.93},
  doi          = {10.1109/CCGRID.2015.93},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ccgrid/AmerLBM15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ccgrid/BlandLSB15,
  author       = {Wesley Bland and
                  Huiwei Lu and
                  Sangmin Seo and
                  Pavan Balaji},
  title        = {Lessons Learned Implementing User-Level Failure Mitigation in {MPICH}},
  booktitle    = {15th {IEEE/ACM} International Symposium on Cluster, Cloud and Grid
                  Computing, CCGrid 2015, Shenzhen, China, May 4-7, 2015},
  pages        = {1123--1126},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/CCGrid.2015.51},
  doi          = {10.1109/CCGRID.2015.51},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ccgrid/BlandLSB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ccgrid/SeoLZB15,
  author       = {Sangmin Seo and
                  Robert Latham and
                  Junchao Zhang and
                  Pavan Balaji},
  title        = {Implementation and Evaluation of {MPI} Nonblocking Collective {I/O}},
  booktitle    = {15th {IEEE/ACM} International Symposium on Cluster, Cloud and Grid
                  Computing, CCGrid 2015, Shenzhen, China, May 4-7, 2015},
  pages        = {1084--1091},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/CCGrid.2015.81},
  doi          = {10.1109/CCGRID.2015.81},
  timestamp    = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ccgrid/SeoLZB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: the software name NWChem is brace-protected so sentence-casing
% bibliography styles do not render it as "nwchem".
@inproceedings{DBLP:conf/ccgrid/SiPHBI15,
  author       = {Min Si and
                  Antonio J. Pe{\~{n}}a and
                  Jeff R. Hammond and
                  Pavan Balaji and
                  Yutaka Ishikawa},
  title        = {Scaling {NWChem} with Efficient and Portable Asynchronous Communication
                  in {MPI} {RMA}},
  booktitle    = {15th {IEEE/ACM} International Symposium on Cluster, Cloud and Grid
                  Computing, CCGrid 2015, Shenzhen, China, May 4-7, 2015},
  pages        = {811--816},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/CCGrid.2015.48},
  doi          = {10.1109/CCGRID.2015.48},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ccgrid/SiPHBI15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: the acronym MPI is brace-protected so sentence-casing styles
% produce "MPI-based" rather than "mpi-based".
@inproceedings{DBLP:conf/ccgrid/ZhaoBG15,
  author       = {Xin Zhao and
                  Pavan Balaji and
                  William Gropp},
  title        = {Runtime Support for Irregular Computation in {MPI}-Based Applications},
  booktitle    = {15th {IEEE/ACM} International Symposium on Cluster, Cloud and Grid
                  Computing, CCGrid 2015, Shenzhen, China, May 4-7, 2015},
  pages        = {701--704},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/CCGrid.2015.82},
  doi          = {10.1109/CCGRID.2015.82},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ccgrid/ZhaoBG15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ccgrid/ZhuZYLZB15,
  author    = {Zhu, Xiaomin and Zhang, Junchao and Yoshii, Kazutomo and
               Li, Shigang and Zhang, Yunquan and Balaji, Pavan},
  title     = {Analyzing {MPI-3.0} Process-Level Shared Memory: {A} Case Study
               with Stencil Computations},
  booktitle = {15th {IEEE/ACM} International Symposium on Cluster, Cloud and
               Grid Computing, CCGrid 2015, Shenzhen, China, May 4-7, 2015},
  pages     = {1099--1106},
  publisher = {{IEEE} Computer Society},
  year      = {2015},
  doi       = {10.1109/CCGRID.2015.131},
  url       = {https://doi.org/10.1109/CCGrid.2015.131},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ccgrid/ZhuZYLZB15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/hpcc/LuSB15,
  author    = {Lu, Huiwei and Seo, Sangmin and Balaji, Pavan},
  title     = {{MPI+ULT:} Overlapping Communication and Computation with
               User-Level Threads},
  booktitle = {17th {IEEE} International Conference on High Performance
               Computing and Communications, {HPCC} 2015, 7th {IEEE}
               International Symposium on Cyberspace Safety and Security,
               {CSS} 2015, and 12th {IEEE} International Conference on
               Embedded Software and Systems, {ICESS} 2015, New York, NY, USA,
               August 24-26, 2015},
  pages     = {444--454},
  publisher = {{IEEE}},
  year      = {2015},
  doi       = {10.1109/HPCC-CSS-ICESS.2015.82},
  url       = {https://doi.org/10.1109/HPCC-CSS-ICESS.2015.82},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/hpcc/LuSB15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/ipps/SiPHBTI15,
  author    = {Si, Min and Pe{\~{n}}a, Antonio J. and Hammond, Jeff R. and
               Balaji, Pavan and Takagi, Masamichi and Ishikawa, Yutaka},
  title     = {Casper: An Asynchronous Progress Model for {MPI} {RMA} on
               Many-Core Architectures},
  booktitle = {2015 {IEEE} International Parallel and Distributed Processing
               Symposium, {IPDPS} 2015, Hyderabad, India, May 25-29, 2015},
  pages     = {665--676},
  publisher = {{IEEE} Computer Society},
  year      = {2015},
  doi       = {10.1109/IPDPS.2015.35},
  url       = {https://doi.org/10.1109/IPDPS.2015.35},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ipps/SiPHBTI15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% Title: the term MPI+Threads is brace-protected so sentence-casing styles
% do not render it as "Mpi+threads". The colon stays outside the braces.
@inproceedings{DBLP:conf/ppopp/AmerLWBM15,
  author       = {Abdelhalim Amer and
                  Huiwei Lu and
                  Yanjie Wei and
                  Pavan Balaji and
                  Satoshi Matsuoka},
  editor       = {Albert Cohen and
                  David Grove},
  title        = {{MPI+Threads}: runtime contention and remedies},
  booktitle    = {Proceedings of the 20th {ACM} {SIGPLAN} Symposium on Principles and
                  Practice of Parallel Programming, PPoPP 2015, San Francisco, CA, USA,
                  February 7-11, 2015},
  pages        = {239--248},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {https://doi.org/10.1145/2688500.2688522},
  doi          = {10.1145/2688500.2688522},
  timestamp    = {Sun, 12 Jun 2022 19:46:08 +0200},
  biburl       = {https://dblp.org/rec/conf/ppopp/AmerLWBM15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: MapReduce-MPI is brace-protected so sentence-casing styles
% do not render it as "mapreduce-mpi".
@inproceedings{DBLP:conf/sc/GuoBBZ15,
  author       = {Yanfei Guo and
                  Wesley Bland and
                  Pavan Balaji and
                  Xiaobo Zhou},
  editor       = {Jackie Kern and
                  Jeffrey S. Vetter},
  title        = {Fault tolerant {MapReduce-MPI} for {HPC} clusters},
  booktitle    = {Proceedings of the International Conference for High Performance Computing,
                  Networking, Storage and Analysis, {SC} 2015, Austin, TX, USA, November
                  15-20, 2015},
  pages        = {34:1--34:12},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {https://doi.org/10.1145/2807591.2807617},
  doi          = {10.1145/2807591.2807617},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/GuoBBZ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/VaidyanathanKPH15,
  author    = {Vaidyanathan, Karthikeyan and Kalamkar, Dhiraj D. and
               Pamnany, Kiran and Hammond, Jeff R. and Balaji, Pavan and
               Das, Dipankar and Park, Jongsoo and Jo{\'{o}}, B{\'{a}}lint},
  editor    = {Kern, Jackie and Vetter, Jeffrey S.},
  title     = {Improving concurrency and asynchrony in multithreaded {MPI}
               applications using software offloading},
  booktitle = {Proceedings of the International Conference for High
               Performance Computing, Networking, Storage and Analysis, {SC}
               2015, Austin, TX, USA, November 15-20, 2015},
  pages     = {30:1--30:12},
  publisher = {{ACM}},
  year      = {2015},
  doi       = {10.1145/2807591.2807602},
  url       = {https://doi.org/10.1145/2807591.2807602},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/VaidyanathanKPH15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/ics/SiPBTI14,
  author    = {Si, Min and Pe{\~{n}}a, Antonio J. and Balaji, Pavan and
               Takagi, Masamichi and Ishikawa, Yutaka},
  editor    = {Bode, Arndt and Gerndt, Michael and Stenstr{\"{o}}m, Per and
               Rauchwerger, Lawrence and Miller, Barton P. and Schulz, Martin},
  title     = {{MT-MPI:} multithreaded {MPI} for many-core environments},
  booktitle = {2014 International Conference on Supercomputing, ICS'14,
               Muenchen, Germany, June 10-13, 2014},
  pages     = {125--134},
  publisher = {{ACM}},
  year      = {2014},
  doi       = {10.1145/2597652.2597658},
  url       = {https://doi.org/10.1145/2597652.2597658},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ics/SiPBTI14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% Title: the acronym MPI and the language name Coarray Fortran are
% capitalised and brace-protected so sentence-casing styles keep them intact.
@inproceedings{DBLP:conf/ppopp/YangBMB14,
  author       = {Chaoran Yang and
                  Wesley Bland and
                  John M. Mellor{-}Crummey and
                  Pavan Balaji},
  editor       = {Jos{\'{e}} E. Moreira and
                  James R. Larus},
  title        = {Portable, {MPI}-interoperable {Coarray Fortran}},
  booktitle    = {{ACM} {SIGPLAN} Symposium on Principles and Practice of Parallel Programming,
                  PPoPP '14, Orlando, FL, USA, February 15-19, 2014},
  pages        = {81--92},
  publisher    = {{ACM}},
  year         = {2014},
  url          = {https://doi.org/10.1145/2555243.2555270},
  doi          = {10.1145/2555243.2555270},
  timestamp    = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ppopp/YangBMB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: the tool name MC-Checker is brace-protected so sentence-casing
% styles do not render it as "Mc-checker". The colon stays outside the braces.
@inproceedings{DBLP:conf/sc/ChenDTBZWHQ14,
  author       = {Zhezhe Chen and
                  James Dinan and
                  Zhen Tang and
                  Pavan Balaji and
                  Hua Zhong and
                  Jun Wei and
                  Tao Huang and
                  Feng Qin},
  editor       = {Trish Damkroger and
                  Jack J. Dongarra},
  title        = {{MC-Checker}: Detecting Memory Consistency Errors in {MPI} One-Sided
                  Applications},
  booktitle    = {International Conference for High Performance Computing, Networking,
                  Storage and Analysis, {SC} 2014, New Orleans, LA, USA, November 16-21,
                  2014},
  pages        = {499--510},
  publisher    = {{IEEE} Computer Society},
  year         = {2014},
  url          = {https://doi.org/10.1109/SC.2014.46},
  doi          = {10.1109/SC.2014.46},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sc/ChenDTBZWHQ14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/sc/ZounmevoZBGA14,
  author    = {Zounmevo, Judicael A. and Zhao, Xin and Balaji, Pavan and
               Gropp, William and Afsahi, Ahmad},
  editor    = {Damkroger, Trish and Dongarra, Jack J.},
  title     = {Nonblocking Epochs in {MPI} One-Sided Communication},
  booktitle = {International Conference for High Performance Computing,
               Networking, Storage and Analysis, {SC} 2014, New Orleans, LA,
               USA, November 16-21, 2014},
  pages     = {475--486},
  publisher = {{IEEE} Computer Society},
  year      = {2014},
  doi       = {10.1109/SC.2014.44},
  url       = {https://doi.org/10.1109/SC.2014.44},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sc/ZounmevoZBGA14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/hpcc/BalajiK13,
  author    = {Balaji, Pavan and Kimpe, Dries},
  title     = {On the Reproducibility of {MPI} Reduction Operations},
  booktitle = {10th {IEEE} International Conference on High Performance
               Computing and Communications {\&} 2013 {IEEE} International
               Conference on Embedded and Ubiquitous Computing, {HPCC/EUC}
               2013, Zhangjiajie, China, November 13-15, 2013},
  pages     = {407--414},
  publisher = {{IEEE}},
  year      = {2013},
  doi       = {10.1109/HPCC.AND.EUC.2013.65},
  url       = {https://doi.org/10.1109/HPCC.and.EUC.2013.65},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/hpcc/BalajiK13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/icpp/HaqueYDB13,
  author    = {Haque, Md. Ziaul and Yi, Qing and Dinan, James and Balaji, Pavan},
  title     = {Enhancing Performance Portability of {MPI} Applications through
               Annotation-Based Transformations},
  booktitle = {42nd International Conference on Parallel Processing, {ICPP}
               2013, Lyon, France, October 1-4, 2013},
  pages     = {631--640},
  publisher = {{IEEE} Computer Society},
  year      = {2013},
  doi       = {10.1109/ICPP.2013.77},
  url       = {https://doi.org/10.1109/ICPP.2013.77},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icpp/HaqueYDB13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% Title: the toolkit name Global Arrays is brace-protected so sentence-casing
% styles do not render it as "global arrays".
@inproceedings{DBLP:conf/ipps/DinanBHKT12,
  author       = {James Dinan and
                  Pavan Balaji and
                  Jeff R. Hammond and
                  Sriram Krishnamoorthy and
                  Vinod Tipparaju},
  title        = {Supporting the {Global Arrays} {PGAS} Model Using {MPI} One-Sided Communication},
  booktitle    = {26th {IEEE} International Parallel and Distributed Processing Symposium,
                  {IPDPS} 2012, Shanghai, China, May 21-25, 2012},
  pages        = {739--750},
  publisher    = {{IEEE} Computer Society},
  year         = {2012},
  url          = {https://doi.org/10.1109/IPDPS.2012.72},
  doi          = {10.1109/IPDPS.2012.72},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/DinanBHKT12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/hipc/WangYCTBB11,
  author    = {Wang, Rui and Yao, Erlin and Chen, Mingyu and Tan, Guangming and
               Balaji, Pavan and Buntinas, Darius},
  title     = {Building algorithmically nonstop fault tolerant {MPI} programs},
  booktitle = {18th International Conference on High Performance Computing,
               HiPC 2011, Bengaluru, India, December 18-21, 2011},
  pages     = {1--9},
  publisher = {{IEEE} Computer Society},
  year      = {2011},
  doi       = {10.1109/HIPC.2011.6152716},
  url       = {https://doi.org/10.1109/HiPC.2011.6152716},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/hipc/WangYCTBB11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/pvm/DinanKBHKTV11,
  author    = {Dinan, James and Krishnamoorthy, Sriram and Balaji, Pavan and
               Hammond, Jeff R. and Krishnan, Manojkumar and
               Tipparaju, Vinod and Vishnu, Abhinav},
  editor    = {Cotronis, Yiannis and Danalis, Anthony and
               Nikolopoulos, Dimitrios S. and Dongarra, Jack J.},
  title     = {Noncollective Communicator Creation in {MPI}},
  booktitle = {Recent Advances in the Message Passing Interface - 18th
               European {MPI} Users' Group Meeting, EuroMPI 2011, Santorini,
               Greece, September 18-21, 2011. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {6960},
  pages     = {282--291},
  publisher = {Springer},
  year      = {2011},
  doi       = {10.1007/978-3-642-24449-0\_32},
  url       = {https://doi.org/10.1007/978-3-642-24449-0\_32},
  timestamp = {Tue, 14 May 2019 10:00:52 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/DinanKBHKTV11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/pvm/RashtiGBAG11,
  author    = {Rashti, Mohammad J. and Green, Jonathan and Balaji, Pavan and
               Afsahi, Ahmad and Gropp, William},
  editor    = {Cotronis, Yiannis and Danalis, Anthony and
               Nikolopoulos, Dimitrios S. and Dongarra, Jack J.},
  title     = {Multi-core and Network Aware {MPI} Topology Functions},
  booktitle = {Recent Advances in the Message Passing Interface - 18th
               European {MPI} Users' Group Meeting, EuroMPI 2011, Santorini,
               Greece, September 18-21, 2011. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {6960},
  pages     = {50--60},
  publisher = {Springer},
  year      = {2011},
  doi       = {10.1007/978-3-642-24449-0\_8},
  url       = {https://doi.org/10.1007/978-3-642-24449-0\_8},
  timestamp = {Mon, 05 Jun 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/pvm/RashtiGBAG11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% Title: the software names Global Arrays and NWChem are capitalised and
% brace-protected so sentence-casing styles keep them intact.
@inproceedings{DBLP:conf/sc/DinanBHKT11,
  author       = {James Dinan and
                  Pavan Balaji and
                  Jeff R. Hammond and
                  Sriram Krishnamoorthy and
                  Vinod Tipparaju},
  editor       = {Scott A. Lathrop and
                  Jim Costa and
                  William Kramer},
  title        = {Poster: High-level, one-sided programming models on {MPI:} a case
                  study with {Global Arrays} and {NWChem}},
  booktitle    = {Conference on High Performance Computing Networking, Storage and Analysis
                  - Companion Volume, {SC} 2011, Seattle, WA, USA, November 12-18, 2011},
  pages        = {37--38},
  publisher    = {{ACM}},
  year         = {2011},
  url          = {https://doi.org/10.1145/2148600.2148620},
  doi          = {10.1145/2148600.2148620},
  timestamp    = {Fri, 03 Jul 2020 08:57:24 +0200},
  biburl       = {https://dblp.org/rec/conf/sc/DinanBHKT11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

