{"created":"2023-09-20T08:09:37.629515+00:00","id":6374,"links":{},"metadata":{"_buckets":{"deposit":"cd52946d-2ace-4c67-88ea-102c4c7633c7"},"_deposit":{"created_by":7,"id":"6374","owners":[7],"pid":{"revision_id":0,"type":"depid","value":"6374"},"status":"published"},"_oai":{"id":"oai:nied-repo.bosai.go.jp:00006374","sets":[]},"author_link":[],"item_10001_biblio_info_7":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2012-05-23","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"2-3","bibliographicPageEnd":"155","bibliographicPageStart":"147","bibliographicVolumeNumber":"28","bibliographic_titles":[{"bibliographic_title":"Computer Science - Research and Development","bibliographic_titleLang":"ja"},{"bibliographic_title":"COMPUTER SCIENCE-RESEARCH AND DEVELOPMENT","bibliographic_titleLang":"en"}]}]},"item_10001_description_5":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"This paper proposes the design of ultra scalable MPI collective communication for the K computer, which consists of 82,944 computing nodes and is the world's first system over 10 PFLOPS. The nodes are connected by a Tofu interconnect that introduces six dimensional mesh/torus topology. Existing MPI libraries, however, perform poorly on such a direct network system since they assume typical cluster environments. Thus, we design collective algorithms optimized for the K computer. On the design of the algorithms, we place importance on collision-freeness for long messages and low latency for short messages. The long-message algorithms use multiple RDMA network interfaces and consist of neighbor communication in order to gain high bandwidth and avoid message collisions. On the other hand, the short-message algorithms are designed to reduce software overhead, which comes from the number of relaying nodes. 
The evaluation results on up to 55,296 nodes of the K computer show the new implementation outperforms the existing one for long messages by a factor of 4 to 11 times. It also shows the short-message algorithms complement the long-message ones.","subitem_description_language":"en","subitem_description_type":"Other"}]},"item_10001_publisher_8":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"Springer Science and Business Media LLC","subitem_publisher_language":"ja"},{"subitem_publisher":"SPRINGER HEIDELBERG","subitem_publisher_language":"en"}]},"item_10001_relation_14":{"attribute_name":"DOI","attribute_value_mlt":[{"subitem_relation_type_id":{"subitem_relation_type_id_text":"10.1007/s00450-012-0211-7"}}]},"item_10001_source_id_9":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"1865-2042","subitem_source_identifier_type":"EISSN"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Tomoya Adachi","creatorNameLang":"ja"},{"creatorName":"Tomoya Adachi","creatorNameLang":"en"}]},{"creatorNames":[{"creatorName":"Naoyuki Shida","creatorNameLang":"ja"},{"creatorName":"Naoyuki Shida","creatorNameLang":"en"}]},{"creatorNames":[{"creatorName":"Kenichi Miura","creatorNameLang":"ja"},{"creatorName":"Kenichi Miura","creatorNameLang":"en"}]},{"creatorNames":[{"creatorName":"Shinji Sumimoto","creatorNameLang":"ja"},{"creatorName":"Shinji Sumimoto","creatorNameLang":"en"}]},{"creatorNames":[{"creatorName":"Atsuya Uno","creatorNameLang":"ja"},{"creatorName":"Atsuya Uno","creatorNameLang":"en"}]},{"creatorNames":[{"creatorName":"Motoyoshi Kurokawa","creatorNameLang":"ja"},{"creatorName":"Motoyoshi Kurokawa","creatorNameLang":"en"}]},{"creatorNames":[{"creatorName":"Fumiyoshi Shoji","creatorNameLang":"ja"},{"creatorName":"Fumiyoshi Shoji","creatorNameLang":"en"}]},{"creatorNames":[{"creatorName":"Mitsuo Yokokawa","creatorNameLang":"ja"},{"creatorName":"Mitsuo 
Yokokawa","creatorNameLang":"en"}]}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_title":"The design of ultra scalable MPI collective communication on the K computer","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"The design of ultra scalable MPI collective communication on the K computer","subitem_title_language":"ja"},{"subitem_title":"The design of ultra scalable MPI collective communication on the K computer","subitem_title_language":"en"}]},"item_type_id":"40001","owner":"7","path":["1670839190650"],"pubdate":{"attribute_name":"PubDate","attribute_value":"2023-09-20"},"publish_date":"2023-09-20","publish_status":"0","recid":"6374","relation_version_is_last":true,"title":["The design of ultra scalable MPI collective communication on the K computer"],"weko_creator_id":"7","weko_shared_id":-1},"updated":"2023-09-20T08:09:40.336173+00:00"}