{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,7]],"date-time":"2024-09-07T16:32:16Z","timestamp":1725726736349},"reference-count":36,"publisher":"IEEE","license":[{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,12]]},"DOI":"10.1109\/hipc.2019.00041","type":"proceedings-article","created":{"date-parts":[[2020,2,14]],"date-time":"2020-02-14T09:36:22Z","timestamp":1581672982000},"page":"267-276","source":"Crossref","is-referenced-by-count":4,"title":["High-Performance Adaptive MPI Derived Datatype Communication for Modern Multi-GPU Systems"],"prefix":"10.1109","author":[{"given":"Ching-Hsiang","family":"Chu","sequence":"first","affiliation":[]},{"given":"Jahanzeb Maqbool","family":"Hashmi","sequence":"additional","affiliation":[]},{"given":"Kawthar Shafie","family":"Khorassani","sequence":"additional","affiliation":[]},{"given":"Hari","family":"Subramoni","sequence":"additional","affiliation":[]},{"given":"Dhabaleswar K.","family":"Panda","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-24449-0_18"},{"journal-title":"halo exchange use cases code for benchmarking using GCL","year":"2015","key":"ref32"},{"journal-title":"A generic library for stencil computations","year":"2012","author":"bianco","key":"ref31"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-58667-0_18"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-03770-2_11"},{"key":"ref35","first-page":"14","article-title":"High performance implementation of MPI derived datatype communication over InfiniBand","author":"wu","year":"2004","journal-title":"18th International Parallel and Distributed Processing Symposium 2004 Proceedings"},{"key":"ref34","first-page":"412","article-title":"Improving the performance of MPI derived datatypes by optimizing memory-access cost","author":"gropp","year":"2003","journal-title":"2003 Proceedings IEEE International Conference on Cluster Computing"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTER.2011.42"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTER.2012.72"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2013.234"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICPP.2014.31"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/2907294.2907317"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2016.99"},{"journal-title":"MVAPICH2 High Performance MPI over InfiniBand 10GigE\/iWARP and RoCE","year":"2019","key":"ref16"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-30218-6_19"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2019.00045"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-30218-6_14"},{"journal-title":"A fast GPU memory copy library based on NVIDIA GPUDirect RDMA technology","year":"2019","key":"ref28"},{"key":"ref4","first-page":"188","article-title":"High Performance Computing","author":"stone","year":"2016","journal-title":"Early Experiences Porting the NAMD and VMD Molecular Simulation and Analysis Software to GPU-Accelerated OpenPOWER Platforms"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-48158-3_14"},{"article-title":"Top 500 Supercomputer sites","year":"2019","author":"strohmaier","key":"ref3"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2018.00054"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2019.00034"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.5194\/gmd-11-1665-2018"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2008.5213210"},{"journal-title":"Message Passing Interface Forum","year":"2019","key":"ref7"},{"journal-title":"NVIDIA DGX-2","year":"2019","key":"ref2"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTER.2013.6702619"},{"journal-title":"Whitepaper NVIDIA Tesla P100 section ‘NVLink High Speed Interconnect’","year":"2019","key":"ref1"},{"journal-title":"NVIDIA GPUDirect","year":"2019","key":"ref20"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/HiPC.2014.7116873"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPSW.2012.228"},{"journal-title":"NVIDIA profiling tools","year":"0","key":"ref24"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2018.2867222"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33518-1_17"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CCGrid.2016.111"}],"event":{"name":"2019 IEEE 26th International Conference on High Performance Computing, Data, and Analytics (HiPC)","start":{"date-parts":[[2019,12,17]]},"location":"Hyderabad, India","end":{"date-parts":[[2019,12,20]]}},"container-title":["2019 IEEE 26th International Conference on High Performance Computing, Data, and Analytics (HiPC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8970174\/8990379\/08990650.pdf?arnumber=8990650","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,18]],"date-time":"2022-07-18T15:34:21Z","timestamp":1658158461000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8990650\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,12]]},"references-count":36,"URL":"http:\/\/dx.doi.org\/10.1109\/hipc.2019.00041","relation":{},"subject":[],"published":{"date-parts":[[2019,12]]}}}