% Publication database, grouped by entry type (book, article, inproceedings),
% newest first within each group. Citation keys are left unchanged so that
% existing citations keep resolving.
% Literal & and _ are written as \& and \_ because they are special to LaTeX.
% Entries with an empty booktitle have no venue recorded; fill in when known.

@book{CTT100790651,
  author    = {Toshio Endo and Hiroko Midorikawa and Yukinori Sato},
  title     = {Software Technology That Deals with Deeper Memory Hierarchy in Post-petascale Era},
  publisher = {Springer},
  year      = 2019,
}

@article{CTT100893936,
  author    = {William S. Moses and Ivan R. Ivanov and Jens Domke and Toshio Endo and Johannes Doerfert and Oleksandr Zinenko},
  title     = {High-Performance GPU-to-CPU Transpilation and Optimization via High-Level Parallel Constructs},
  journal   = {arXiv},
  year      = 2023,
}

@article{CTT100787688,
  author    = {Yukinori Sato and Tomoya Yuki and Toshio Endo},
  title     = {An Autotuning Framework for Scalable Execution of Tiled Code via Iterative Polyhedral Compilation},
  journal   = {ACM Transactions on Architecture and Code Optimization (TACO)},
  volume    = {15},
  number    = {4},
  articleno = {67},
  numpages  = {23},
  year      = 2019,
}

@article{CTT100711319,
  author    = {Katsuki Fujisawa and Toyotaro Suzumura and Hitoshi Sato and Koji Ueno and Yuichiro Yasui and Keita Iwabuchi and Toshio Endo},
  title     = {Advanced Computing \& Optimization Infrastructure for Extremely Large-Scale Graphs on Post Peta-Scale Supercomputers},
  journal   = {Optimization in the Real World - Toward Solving Real-World Optimization Problems -, Series of Mathematics for Industry},
  year      = 2016,
}

@article{CTT100813033,
  author    = {高嵜 祐樹 and 遠藤敏夫 and 松岡 聡},
  title     = {GPU搭載システムにおける都市気流シミュレーションの大規模化と性能モデル},
  journal   = {情報処理学会研究報告. [ハイパフォーマンスコンピューティング]},
  year      = 2015,
}

@article{CTT100632832,
  author    = {遠藤 敏夫 and 額田 彰 and 松岡 聡},
  title     = {スーパーコンピュータTSUBAME 2.0 における Linpack 性能1 ペタフロップス超の達成},
  journal   = {情報処理学会論文誌コンピューティングシステム},
  year      = 2011,
}

@article{CTT100812644,
  author    = {遠藤敏夫},
  title     = {GPGPUと東工大TSUBAME2.0スパコン},
  journal   = {電子情報通信学会ソサイエティ大会講演論文集},
  year      = 2011,
}

@article{CTT100617859,
  author    = {遠藤 敏夫 and 額田 彰 and 松岡 聡},
  title     = {異種アクセラレータを持つTSUBAMEスーパーコンピュータのLinpack評価},
  journal   = {応用数理},
  year      = 2010,
}

@article{CTT100596765,
  author    = {滝澤真一朗 and 遠藤敏夫 and 松岡聡},
  title     = {次世代光インターコネクトでのMPI通信に関する研究},
  journal   = {コンピュータソフトウェア},
  year      = 2009,
}

@article{CTT100596769,
  author    = {滝澤真一朗 and 遠藤敏夫 and 松岡聡},
  title     = {光サーキットネットワークの補助的利用によるHPCアプリケーション性能向上},
  journal   = {情報処理学会 コンピューティングシステム(ACS)},
  year      = 2009,
}

@article{CTT100574009,
  author    = {額田彰 and 尾形泰彦 and 遠藤敏夫 and 松岡聡},
  title     = {CUDA 環境における高性能3次元FFT},
  journal   = {情報処理学会論文誌コンピューティングシステム},
  year      = 2008,
}

@article{CTT100574008,
  author    = {尾形泰彦 and 遠藤敏夫 and 丸山直也 and 松岡聡},
  title     = {性能モデルに基づくCPU及びGPUを併用する効率的なFFTライブラリ},
  journal   = {情報処理学会論文誌コンピューティングシステム},
  year      = 2008,
}

@article{CTT100600633,
  author    = {遠藤敏夫 and 松岡聡 and 橋爪信明 and 長坂真路},
  title     = {ヘテロ型スーパーコンピュータTSUBAMEのLinpackによる性能評価},
  journal   = {情報処理学会論文誌コンピューティングシステム},
  year      = 2007,
}

@article{CTT100576057,
  author    = {千葉立寛 and 遠藤敏夫 and 松岡聡},
  title     = {グリッド環境におけるマルチレーンを用いたMPIコレクティブ通信アルゴリズム},
  journal   = {情報処理学会論文誌コンピューティングシステム},
  year      = 2007,
}

@inproceedings{CTT100911731,
  author    = {Futa Kambe and Toshio Endo},
  title     = {Accelerating Stencil Computations on a GPU by Combining Using Tensor Cores and Temporal Blocking},
  booktitle = {Proceedings of Workshop on General Purpose Processing using GPU (GPGPU 2024)},
  year      = 2024,
}

@inproceedings{CTT100908559,
  author    = {Ivan Radanov Ivanov and Oleksandr Zinenko and Jens Domke and Toshio Endo and William S. Moses},
  title     = {Retargeting and Respecializing GPU Workloads for Performance Portability},
  booktitle = {Proceedings of The International Symposium on Code Generation and Optimization (CGO 2024)},
  year      = 2024,
}

@inproceedings{CTT100911730,
  author    = {Ivan Radanov Ivanov and Jens Domke and Toshio Endo and Johannes Doerfert},
  title     = {Automatic Parallelization and OpenMP Offloading of Fortran},
  booktitle = {Proceedings of LLVM Performance Workshop},
  year      = 2024,
}

@inproceedings{CTT100908558,
  author    = {Ryubu Hosoki and Toshio Endo and Takahiro Hirofuchi and Tsutomu Ikegami},
  title     = {AshPipe: Asynchronous Hybrid Pipeline Parallel for DNN Training},
  booktitle = {Proceedings of The International Conference on High Performance Computing in Asia-Pacific Region (HPC Asia 2024)},
  year      = 2024,
}

@inproceedings{CTT100908557,
  author    = {Shohei Minami and Toshio Endo and Akihiro Nomura},
  title     = {The Aggressive Oversubscribing Scheduling for Interactive Jobs on a Supercomputing System},
  booktitle = {Proceedings of IEEE High Performance Extreme Computing Conference (HPEC 2023)},
  year      = 2023,
}

@inproceedings{CTT100908561,
  author    = {岡本 洸琉 and 遠藤 敏夫},
  title     = {動的スケジューリングライブラリを用いたPythonにおける分散コレスキー分解の実装と評価},
  booktitle = {情報処理学会研究報告},
  year      = 2023,
}

@inproceedings{CTT100908556,
  author    = {Chenyu Wang and Toshio Endo and Takahiro Hirofuchi and Tsutomu Ikegami},
  title     = {Pyramid Swin Transformer for Multi-Task: Expanding to More Computer Vision Tasks},
  booktitle = {Proceedings of Conference on Advanced Concepts for Intelligent Vision Systems (ACIVS 2023)},
  year      = 2023,
}

@inproceedings{CTT100908560,
  author    = {神戸 風太 and 遠藤 敏夫},
  title     = {GPU上のTensor coreを使ったステンシル計算の時間ブロッキングによる高速化},
  booktitle = {情報処理学会研究報告},
  year      = 2023,
}

@inproceedings{CTT100911732,
  author    = {Hayato Fujita and Akihiro Nomura and Toshio Endo and Masakazu Sekijima},
  title     = {Enhancing the Performance of AlphaFold Through Modified Storage Method and Optimization of HHblits on TSUBAME3.0 Supercomputer},
  booktitle = {Proceedings of 2023 Congress in Computer Science, Computer Engineering, \& Applied Computing (CSCE)},
  year      = 2023,
}

@inproceedings{CTT100908554,
  author    = {Lingqi Zhang and Mohamed Wahib and Peng Chen and Jintao Meng and Xiao Wang and Toshio Endo and Satoshi Matsuoka},
  title     = {Revisiting Temporal Blocking Stencil Optimizations},
  booktitle = {Proceedings of ACM International Conference on Supercomputing (ICS 2023)},
  year      = 2023,
}

@inproceedings{CTT100908555,
  author    = {Lingqi Zhang and Mohamed Wahib and Peng Chen and Jintao Meng and Xiao Wang and Toshio Endo and Satoshi Matsuoka},
  title     = {PERKS: a Locality-Optimized Execution Model for Iterative Memory-bound GPU Applications},
  booktitle = {Proceedings of ACM International Conference on Supercomputing (ICS 2023)},
  year      = 2023,
}

@inproceedings{CTT100893955,
  author    = {幸 朋矢 and 遠藤 敏夫},
  title     = {次世代高性能メモリシステムにおけるステンシル計算の局所性向上技術の評価},
  booktitle = {情報処理学会研究報告},
  year      = 2023,
}

@inproceedings{CTT100893934,
  author    = {William S. Moses and Ivan Radanov Ivanov and Jens Domke and Toshio Endo and Johannes Doerfert and Oleksandr Zinenko},
  title     = {High-Performance GPU-to-CPU Transpilation and Optimization via High-Level Parallel Constructs},
  booktitle = {Proceedings of ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming (PPoPP 2023)},
  year      = 2023,
}

@inproceedings{CTT100893932,
  author    = {Lingqi Zhang and Mohamed Wahib and Peng Chen and Jintao Meng and Xiao Wang and Toshio Endo and Satoshi Matsuoka},
  title     = {Exploiting Scratchpad Memory for Deep Temporal Blocking},
  booktitle = {Proceedings of the 15th Workshop on General Purpose Processing Using GPU (GPGPU 2023)},
  year      = 2023,
}

@inproceedings{CTT100893929,
  author    = {Chenyu Wang and Toshio Endo and Takahiro Hirofuchi and Tsutomu Ikegami},
  title     = {Pyramid Swin Transformer: Different-Size Windows Swin Transformer for Image Classification and Object Detection},
  booktitle = {Proceedings of the 18th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications},
  year      = 2023,
}

@inproceedings{CTT100891140,
  author    = {Shohei Minami and Toshio Endo and Akihiro Nomura},
  title     = {Effectiveness of the Oversubscribing Scheduling on Supercomputer Systems},
  booktitle = {HPC Asia '23: Proceedings of the International Conference on High Performance Computing in Asia-Pacific Region},
  year      = 2023,
}

@inproceedings{CTT100893928,
  author    = {Hiroki Aikawa and Toshio Endo and Tomoya Yuki and Takahiro Hirofuchi and Tsutomu Ikegami},
  title     = {Efficient Stencil Computation with Temporal Blocking by Halide DSL},
  booktitle = {Proceedings of 20th IEEE International Symposium on Parallel and Distributed Processing with Applications (ISPA)},
  year      = 2022,
}

@inproceedings{CTT100893940,
  author    = {Lingqi Zhang and Mohamed Wahib and Peng Chen and Jintao Meng and Xiao Wang and Toshio Endo and Satoshi Matsuoka},
  title     = {Breaking the Memory Bottleneck for Iterative Memory-bound Applications Via Persistent Kernels},
  booktitle = {IPSJ SIG Technical Report},
  year      = 2022,
}

@inproceedings{CTT100893954,
  author    = {萩原 汐 and 吉川 隆英 and 幸 朋矢 and 遠藤 敏夫},
  title     = {3D Stacked SRAMを活用したHPC向けメモリアーキテクチャの検討},
  booktitle = {情報処理学会研究報告},
  year      = 2022,
}

@inproceedings{CTT100893951,
  author    = {瓜生 侑 and 遠藤 敏夫},
  title     = {ラムダ式を用いる移植性の高い並列プログラムの実装とCPU・GPU上の評価},
  booktitle = {情報処理学会研究報告},
  year      = 2022,
}

@inproceedings{CTT100893927,
  author    = {Chenyu Wang and Toshio Endo and Takahiro Hirofuchi and Tsutomu Ikegami},
  title     = {Speed-up Single Shot Detector on GPU with CUDA},
  booktitle = {Studies in Computational Intelligence},
  year      = 2022,
}

@inproceedings{CTT100882932,
  author    = {大沢 泰生 and 遠藤 敏夫 and 野村 哲弘},
  title     = {タンパク質構造解析システムAlphafoldの実行時ファイルステージングを用いた高速化},
  booktitle = {情報処理学会研究報告},
  year      = 2022,
}

@inproceedings{CTT100893952,
  author    = {細木 隆豊 and 遠藤 敏夫 and 広渕 崇宏 and 池上 努},
  title     = {負荷分散を改善したハイブリッドパイプライン並列深層学習手法},
  booktitle = {情報処理学会研究報告},
  year      = 2022,
}

@inproceedings{CTT100869007,
  author    = {藤田 隼斗 and 野村 哲弘 and 遠藤 敏夫 and 関嶋 政和},
  title     = {タンパク質立体構造予測システム AlphaFold の TSUBAME3.0 上での高速化},
  booktitle = {情報処理学会研究報告},
  year      = 2022,
}

@inproceedings{CTT100866033,
  author    = {萩原 汐 and 児玉 宏喜 and 吉川 隆英 and 幸 朋矢 and 遠藤 敏夫},
  title     = {疎行列演算高速化のためのメモリアーキテクチャ探索},
  booktitle = {},
  year      = 2022,
}

@inproceedings{CTT100866020,
  author    = {幸 朋矢 and 遠藤 敏夫},
  title     = {次世代高性能計算ノードにむけたメモリアーキテクチャ探索のためのツールチェーン},
  booktitle = {},
  year      = 2022,
}

@inproceedings{CTT100866019,
  author    = {Ivan Ivanov and Jens Domke and Toshio Endo},
  title     = {Automatic translation of CUDA code into high performance CPU code using LLVM IR transformations},
  booktitle = {},
  year      = 2022,
}

@inproceedings{CTT100866035,
  author    = {遠藤 敏夫},
  title     = {TSUBAMEスーパーコンピュータのAI・ビッグデータ対応と展望},
  booktitle = {},
  year      = 2021,
}

@inproceedings{CTT100866034,
  author    = {遠藤 敏夫},
  title     = {TSUBAMEスパコンの過去、現在、未来},
  booktitle = {},
  year      = 2021,
}

@inproceedings{CTT100861644,
  author    = {相川 洋貴 and 遠藤 敏夫 and 幸 朋矢 and 広渕 崇宏},
  title     = {時間ブロッキングを用いたステンシル計算のHalide言語による高性能実装と評価},
  booktitle = {情報処理学会研究報告, 2021-HPC-180, No. 16},
  year      = 2021,
}

@inproceedings{CTT100861643,
  author    = {細木 隆豊 and 野村 哲弘 and 遠藤 敏夫},
  title     = {GPUクラスタにおけるハイブリッド並列DNN学習のボトルネック分析と改良},
  booktitle = {情報処理学会研究報告, 2021-HPC-180, No. 9},
  year      = 2021,
}

@inproceedings{CTT100861647,
  author    = {Shohei Minami and Toshio Endo and Akihiro Nomura},
  title     = {Measurement and Modeling of Performance of HPC Applications towards Overcommitting Scheduling Systems},
  booktitle = {},
  year      = 2021,
}

@inproceedings{CTT100845079,
  author    = {野村 哲弘 and 滝澤 真一朗 and 三浦 信一 and 遠藤 敏夫 and 松葉 浩也},
  title     = {センサー情報を意識したジョブスケジューリング実現のための標準ジョブ履歴スキーマの提案},
  booktitle = {情報処理学会研究報告},
  year      = 2021,
}

@inproceedings{CTT100854541,
  author    = {Ivan R. Ivanov and Jens Domke and Akihiro Nomura and Toshio Endo},
  title     = {Improved failover for HPC interconnects through localised routing restoration},
  booktitle = {},
  year      = 2021,
}

@inproceedings{CTT100854537,
  author    = {Shohei Minami and Toshio Endo and Akihiro Nomura},
  title     = {Performance Modeling of HPC Applications on Overcommitted Systems},
  booktitle = {Proceedings of HPC Asia 2021},
  year      = 2021,
}

@inproceedings{CTT100845078,
  author    = {安良岡 由規 and 野村 哲弘 and 遠藤 敏夫},
  title     = {学内インフラとしてのスパコンの対話的利用による利便性向上},
  booktitle = {},
  year      = 2020,
}

@inproceedings{CTT100829261,
  author    = {野村 哲弘 and 遠藤 敏夫 and 三浦 信一 and 朝倉 博紀 and 越野 俊充 and 草間 俊博},
  title     = {TSUBAME3のインタラクティブ利用の利便性向上にむけた取り組み},
  booktitle = {},
  year      = 2020,
}

@inproceedings{CTT100829260,
  author    = {南 将平 and 遠藤 敏夫 and 野村 哲弘},
  title     = {オーバーコミットスケジュール時のアプリ性能の予備評価},
  booktitle = {},
  year      = 2020,
}

@inproceedings{CTT100814478,
  author    = {Kazuaki Matsumura and Hamid Reza Zohouri and Mohamed Wahib and Toshio Endo and Satoshi Matsuoka},
  title     = {AN5D: Automated Stencil Framework for High-Degree Temporal Blocking on GPUs},
  booktitle = {},
  year      = 2020,
}

@inproceedings{CTT100814480,
  author    = {Tomoya Yuki and Toshio Endo},
  title     = {Toward Latency-Aware Data Arrangement on Many-Core Processors},
  booktitle = {},
  year      = 2020,
}

@inproceedings{CTT100814479,
  author    = {Toshio Endo},
  title     = {Integrating Cache Oblivious Approach with Modern Processor Architecture: The Case of Floyd-Warshall Algorithm},
  booktitle = {},
  year      = 2020,
}

@inproceedings{CTT100802670,
  author    = {Toshio Endo},
  title     = {Activity Report from Tokyo Tech: Energy Efficiency of TSUBAME3.0},
  booktitle = {},
  year      = 2019,
}

@inproceedings{CTT100802674,
  author    = {野村 哲弘 and 三浦 信一 and 實本 英之 and 額田 彰 and 遠藤 敏夫},
  title     = {TSUBAME3.0におけるストレージ利用効率化のためのファイルシステムベンチマーク},
  booktitle = {},
  year      = 2019,
}

@inproceedings{CTT100802673,
  author    = {土川 稔生 and 遠藤 敏夫 and 野村 哲弘 and 近藤正章 and 大山 洋介 and 松岡 聡},
  title     = {メモリアクセスデータを用いた機械学習によるアプリケーションの類型化},
  booktitle = {},
  year      = 2019,
}
% Conference papers and presentations, 2019 back to 2018.
% Titles carry no trailing punctuation; the bibliography style adds its own.
% Entries with an empty booktitle have no venue recorded; fill in when known.

@inproceedings{CTT100793584,
  author    = {Toshio Endo},
  title     = {Current Status of TSUBAME3.0 Operation (as of Mar 2019)},
  booktitle = {},
  year      = 2019,
}

@inproceedings{CTT100789659,
  author    = {Yuki Ito and Haruki Imai and Tung Le Duc and Yasushi Negishi and Kiyokuni Kawachiya and Ryo Matsumiya and Toshio Endo},
  title     = {Profiling based out-of-core hybrid method for large neural networks},
  booktitle = {},
  year      = 2019,
}

@inproceedings{CTT100775520,
  author    = {遠藤敏夫},
  title     = {光インターコネクト技術を用いたTSUBAME3.0スーパーコンピュータ},
  booktitle = {},
  year      = 2018,
}

@inproceedings{CTT100770041,
  author    = {Ryo Matsumiya and Toshio Endo},
  title     = {RMA-based Communication Library Featuring Node-local NVMs},
  booktitle = {},
  year      = 2018,
}

@inproceedings{CTT100770043,
  author    = {Toshio Endo},
  title     = {Applying Recursive Temporal Blocking for Stencil Computations to Deeper Memory Hierarchy},
  booktitle = {},
  year      = 2018,
}

@inproceedings{CTT100770511,
  author    = {伊藤 祐貴 and 今井 晴基 and レドゥック トゥン and 根岸 康 and 河内谷 清久仁 and 松宮 遼 and 遠藤 敏夫},
  title     = {GPUメモリ管理の実行時最適化による大規模深層学習の高速化},
  booktitle = {情報処理学会研究報告, 2018-HPC-165 No.30},
  year      = 2018,
}

@inproceedings{CTT100770037,
  author    = {見村 朔 and 遠藤敏夫},
  title     = {LSTM を用いた映像分類システムの学習順序による高速化},
  booktitle = {},
  year      = 2018,
}

@inproceedings{CTT100770039,
  author    = {Ryo Matsumiya and Toshio Endo},
  title     = {vGASNet: Scalable RMA-based Communication Library for Out-of-core Data Processing},
  booktitle = {},
  year      = 2018,
}

@inproceedings{CTT100770038,
  author    = {伊藤 祐貴 and Haruki Imai and Tung Le Duc and Yasushi Negishi and Kiyokuni Kawachiya and 松宮 遼 and 遠藤 敏夫},
  title     = {Runtime GPU Memory Optimization for Supporting Large Neural Networks on Chainer},
  booktitle = {},
  year      = 2018,
}

@inproceedings{CTT100765681,
  author    = {遠藤敏夫},
  title     = {TSUBAME3.0冷却システムの紹介},
  booktitle = {},
  year      = 2018,
}

@inproceedings{CTT100765684,
  author    = {Toshio Endo},
  title     = {Realizing Extremely Large-Scale Scientific Applications Using Deep Memory Hierarchy},
  booktitle = {},
  year      = 2018,
}
% Conference papers and presentations, 2018 back to 2016.
% The underscore in "ooc_cuDNN" is written as \_ because a bare _ is only
% valid in LaTeX math mode.
% Entries with an empty booktitle have no venue recorded; fill in when known.

@inproceedings{CTT100765683,
  author    = {Noboru Tanabe and Toshio Endo},
  title     = {Evaluation of Memory-Latency Sensitivity on Manycore Processors with Large Cache},
  booktitle = {},
  year      = 2018,
}

@inproceedings{CTT100765682,
  author    = {Noboru Tanabe and Toshio Endo},
  title     = {Characterizing Memory-Latency Sensitivity of Sparse Matrix Kernels},
  booktitle = {},
  year      = 2018,
}

@inproceedings{CTT100756795,
  author    = {Yuki Ito and Ryo Matsumiya and Toshio Endo},
  title     = {ooc\_cuDNN: Accommodating Convolutional Neural Networks over GPU Memory Capacity},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100765685,
  author    = {Toshio Endo and Hiroko Midorikawa and Yukinori Sato},
  title     = {Software Technology that Deals with Deeper Memory Hierarchy in Post-petascale Era},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100756801,
  author    = {藤田 和宏 and 鶴見慶 and 安良岡由規 and 根本忍 and 梁井善行 and 渡邊寿雄 and 野村 哲弘 and 三浦信一 and 額田彰 and 遠藤敏夫 and 松岡聡},
  title     = {新スーパーコンピュータTSUBAME3.0の概要},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100756800,
  author    = {Toshio Endo and Satoshi Matsuoka},
  title     = {TSUBAME3.0: A Green, Accelerated, Big-Data Supercomputer},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100756799,
  author    = {Yuki Ito and Ryo Matsumiya and Toshio Endo},
  title     = {ooc\_cuDNN: A Deep Learning Library Supporting CNNs over GPU Memory Capacity},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100756796,
  author    = {Shota Kuroda and Toshio Endo and Satoshi Matsuoka},
  title     = {Applying Temporal Blocking with a Directive-based Approach},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100754125,
  author    = {Takashi Shimokawabe and Toshio Endo and Naoyuki Onodera and Takayuki Aoki},
  title     = {A Stencil Framework to Realize Large-scale Computations Beyond Device Memory Capacity on GPU Supercomputers},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100768360,
  author    = {Takashi Shimokawabe and Toshio Endo and Naoyuki Onodera and Takayuki Aoki},
  title     = {A Stencil Framework to Realize Large-scale Computations Beyond Device Memory Capacity on GPU Supercomputers},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100745563,
  author    = {Yukinori Sato and Toshio Endo},
  title     = {An Accurate Simulator of Cache-line Conflicts to Exploit the Underlying Cache Performance},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100747655,
  author    = {松岡 聡 and 遠藤 敏夫 and 額田 彰 and 三浦 信一 and 野村 哲弘 and 佐藤 仁 and 實本 英之 and Drozd Aleksandr},
  title     = {HPCとビッグデータ・AIを融合するグリーン・クラウドスパコンTSUBAME3.0の概要},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100747665,
  author    = {伊藤 祐貴 and 松宮 遼 and 遠藤 敏夫},
  title     = {ooc\_cuDNN: GPU計算機のメモリ階層を利用した大規模深層学習ライブラリの開発},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100747658,
  author    = {幸 朋矢 and 佐藤 幸紀 and 遠藤 敏夫},
  title     = {Polyhedralコンパイラを用いたタイリングパラメータ自動調整ツールのメニーコア環境での評価},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100747654,
  author    = {田邊 昇 and 遠藤 敏夫},
  title     = {Intel Xeon Phiにおける主記憶遅延増加の影響評価},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100747653,
  author    = {松宮 遼 and 遠藤 敏夫},
  title     = {vGASNet: メモリ階層深化に向けたスケーラブルな低レイヤ通信ライブラリ},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100741315,
  author    = {Yukinori Sato and Tomoya Yuki and Toshio Endo},
  title     = {ExanaDBT: A Dynamic Compilation System for Transparent Polyhedral Optimizations at Runtime},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100737176,
  author    = {伊藤祐貴 and 松宮遼 and 遠藤敏夫},
  title     = {メモリ階層の利用によってGPUメモリ容量を超える深層学習手法},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100741317,
  author    = {松宮遼 and 遠藤敏夫},
  title     = {Flash SSD を活用する PGAS フレームワークに対する協調キャッシングの導入},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100737178,
  author    = {田邊 昇 and 遠藤 敏夫},
  title     = {疎行列系アプリケーション性能の主記憶遅延増加の影響評価},
  booktitle = {2017-HPC-158 No.15},
  year      = 2017,
}

@inproceedings{CTT100737180,
  author    = {本山 義史 and 遠藤 敏夫 and 松岡 聡 and 横田 理央 and 福田 圭祐 and 佐藤 育郎},
  title     = {低ランク近似行列によるCNNにおける畳み込み演算の最適化},
  booktitle = {2017-HPC-158 No.25},
  year      = 2017,
}

@inproceedings{CTT100748520,
  author    = {Takashi Shimokawabe and Toshio Endo and Naoyuki Onodera and Takayuki Aoki},
  title     = {Performance Evaluation of Wind Simulation Based on a GPU-computing Framework to Realize Large-scale Stencil Computations Beyond Device Memory Capacity},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100737181,
  author    = {Takashi Shimokawabe and Toshio Endo and Naoyuki Onodera and Takayuki Aoki},
  title     = {Performance Evaluation of Wind Simulation Based on a GPU-computing Framework to Realize Large-scale Stencil Computations Beyond Device Memory Capacity},
  booktitle = {},
  year      = 2017,
}

@inproceedings{CTT100736012,
  author    = {佐藤幸紀 and 幸朋矢 and 遠藤敏夫},
  title     = {透過的メモリ階層チューニングのための動的バイナリ変換機構の設計と開発},
  booktitle = {2016-ARC-216 No.35},
  year      = 2017,
}

@inproceedings{CTT100735528,
  author    = {田邊昇 and 遠藤敏夫},
  title     = {中遅延大容量メモリ階層出現のインパクトと新たな対応に関する初期検討},
  booktitle = {2015-HPC-157 No.11},
  year      = 2016,
}

@inproceedings{CTT100736772,
  author    = {黒田 勝汰 and 遠藤 敏夫 and 松岡 聡},
  title     = {ディレクティブによる時空間ブロッキングの自動適用},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100733946,
  author    = {Satoshi Imamura and Keitaro Oka and Yuichiro Yasui and Yuichi Inadomi and Katsuki Fujisawa and Toshio Endo and Koji Ueno and Keiichiro Fukazawa and Nozomi Hata and Yuta Kakibuka and Koji Inoue and Takatsugu Ono},
  title     = {Evaluating the Impacts of Code-Level Performance Tunings on Power Efficiency},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100735583,
  author    = {遠藤敏夫},
  title     = {ポストペタスケール時代のメモリ階層の深化に対応するソフトウェア技術},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100733942,
  author    = {Ryo Matsumiya and Toshio Endo},
  title     = {PGAS Communication Runtime for Extreme Large Data Computation},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100710139,
  author    = {Toshio Endo},
  title     = {Realizing Out-of-Core Stencil Computations using Multi-Tier Memory Hierarchy on GPGPU Clusters},
  booktitle = {Proceedings of IEEE Cluster Computing (CLUSTER2016)},
  year      = 2016,
}

@inproceedings{CTT100713022,
  author    = {佐藤真平 and 佐藤幸紀 and 遠藤敏夫},
  title     = {ステンシル計算コードの性能とメモリレイアウトの関係性について},
  booktitle = {情報処理学会研究報告},
  year      = 2016,
}

@inproceedings{CTT100713021,
  author    = {松岡 聡 and 天野 英晴 and 中島 研吾 and 井上 弘士 and 工藤 知宏 and 丸山 直也 and 田浦 健次朗 and 岩下 武史 and 片桐 孝洋 and 塙敏博 and 遠藤 敏夫},
  title     = {ポストムーア時代におけるFLOPSからBYTESへの変革},
  booktitle = {情報処理学会研究報告, 2016-HPC-155 No.32},
  year      = 2016,
}

@inproceedings{CTT100713020,
  author    = {松宮 遼 and 遠藤 敏夫},
  title     = {Flash SSDを含む多階層メモリを活用するPGASランタイムシステム},
  booktitle = {情報処理学会研究報告, 2016-HPC-155 No.31},
  year      = 2016,
}

@inproceedings{CTT100748559,
  author    = {下川辺 隆史 and 遠藤敏夫 and 青木 尊之},
  title     = {GPU デバイスメモリを超える計算を可能とするためのステンシル計算フレームワークの拡張とその性能評価},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100713023,
  author    = {下川辺 隆史 and 遠藤 敏夫 and 青木 尊之},
  title     = {GPUデバイスメモリを超える計算を可能とするためのステンシル計算フレームワークの拡張とその性能評価},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100710150,
  author    = {Toshio Endo},
  title     = {Operating Experience with SSD and GPUs},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100710144,
  author    = {Satoshi Matsuoka and Hideharu Amano and Kengo Nakajima and Koji Inoue and Tomohiro Kudoh and Naoya Maruyama and Kenjiro Taura and Takeshi Iwashita and Takahiro Katagiri and Toshihiro Hanawa and Toshio Endo},
  title     = {From FLOPS to BYTES: Disruptive Change in High-Performance Computing towards the Post-Moore Era},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100703204,
  author    = {Yukinori Sato and Toshio Endo},
  title     = {Dynamic Compilation for Transparent Data Locality Analysis and Memory Subsystem Tuning},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100713185,
  author    = {遠藤 敏夫},
  title     = {大規模・高性能演算のための多階層メモリの活用},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100702723,
  author    = {Toshio Endo},
  title     = {Harnessing Multi-tier Memory Hierarchy of GPU, Host and Flash},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100700936,
  author    = {Shimpei Sato and Yukinori Sato and Toshio Endo},
  title     = {A Cache-aware Temporal Blocking Method for 3D Stencil Computation},
  booktitle = {},
  year      = 2016,
}
% Conference papers and presentations, 2016 back to 2011.
% booktitle values do not start with "In": bibliography styles add that word
% themselves. A literal & is written as \& because it is special to LaTeX.
% Entries with an empty booktitle have no venue recorded; fill in when known.

@inproceedings{CTT100713188,
  author    = {松宮遼 and 遠藤敏夫 and 大山恵弘},
  title     = {深化する記憶装置階層のための大規模データ処理基盤の提案},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100713190,
  author    = {Yukinori Sato and Toshio Endo},
  title     = {Consolidating memory locality information obtained from static and dynamic analysis of code for performance tuning in source code},
  booktitle = {},
  year      = 2016,
}

@inproceedings{CTT100812227,
  author    = {Fujisawa, K. and Toshio Endo and Yasui, Y.},
  title     = {Advanced computing and optimization infrastructure for extremely large-scale graphs on post peta-scale supercomputers},
  booktitle = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  year      = 2016,
}

@inproceedings{CTT100698043,
  author    = {Toshio Endo and Yuki Takasaki and Satoshi Matsuoka},
  title     = {Realizing Extremely Large-Scale Stencil Applications on GPU Supercomputers},
  booktitle = {Proceedings of The 21st IEEE International Conference on Parallel and Distributed Systems (ICPADS 2015)},
  year      = 2015,
}

@inproceedings{CTT100704611,
  author    = {野村 哲弘 and 佐々木 淳 and 三浦 信一 and 遠藤 敏夫 and 松岡 聡},
  title     = {TSUBAME2におけるジョブスケジューリング効率化への取り組みと検証},
  booktitle = {大学ICT推進協議会 2015年度年次大会 企画セッション HPCテクノロジー},
  year      = 2015,
}

@inproceedings{CTT100698044,
  author    = {Yuki Tsujita and Toshio Endo and Katsuki Fujisawa},
  title     = {The Scalable Petascale Data-Driven Approach for the Cholesky Factorization with Multiple GPUs},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100702721,
  author    = {Toshio Endo and Akira Nukada and Satoshi Matsuoka},
  title     = {Power Capping Scheduling on TSUBAME2.5 and Upgrade of TSUBAME-KFC},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100698046,
  author    = {Shimpei Sato and Yukinori Sato and Toshio Endo},
  title     = {Investigating Potential Performance Benefits of Memory Layout Optimization based on Roofline Model},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100698045,
  author    = {Yukinori Sato and Shimpei Sato and Toshio Endo},
  title     = {Exana: An Execution-driven Application Analysis Tool for Assisting Productive Performance Tuning},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100718427,
  author    = {佐藤幸紀 and 佐藤真平 and 遠藤敏夫},
  title     = {CPU性能チューニングを支援するアプリケーション解析ツールExanaのデモ},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100718425,
  author    = {佐藤真平 and 佐藤幸紀 and 遠藤敏夫},
  title     = {テンポラルブロッキングを適用したステンシル計算コードのSIMD化とルーフラインモデルを用いた性能解析},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100713187,
  author    = {佐藤真平 and 佐藤幸紀 and 遠藤敏夫},
  title     = {ルーフラインモデルによる性能幅推定とステンシル計算コードにおけるメモリレイアウト最適化による性能最大化},
  booktitle = {情報処理学会研究報告},
  year      = 2015,
}

@inproceedings{CTT100713186,
  author    = {佐藤幸紀 and 遠藤敏夫},
  title     = {実行駆動型キャッシュシミュレーションおよびメモリ参照特性解析におけるオーバーヘッドの評価},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100704613,
  author    = {野村 哲弘 and 佐々木 淳 and 三浦 信一 and 遠藤 敏夫 and 松岡 聡},
  title     = {TSUBAME2におけるスケジュール効率化への取り組みとユーザ動向の見える化},
  booktitle = {情報処理学会 研究報告},
  year      = 2015,
}

@inproceedings{CTT100704618,
  author    = {寺西 賢人 and 野村 哲弘 and 遠藤 敏夫 and 松岡 聡},
  title     = {ノード内同時実行ジョブにおけるパフォーマンスカウンタによるプロセス毎消費電力のモデル化},
  booktitle = {情報処理学会 研究報告},
  year      = 2015,
}

@inproceedings{CTT100696279,
  author    = {Toshio Endo and Satoshi Matsuoka},
  title     = {Realizing Extremely Large-Scale Stencil Applications on GPU Supercomputers with a Memory Hierarchy Management Runtime Library},
  booktitle = {Workshop on Programming Abstractions for Data Locality (PADAL 2015), Berkeley},
  year      = 2015,
}

@inproceedings{CTT100691824,
  author    = {Yuki Tsujita and Toshio Endo},
  title     = {Data Driven Scheduling Approach for the Multi-node Multi-GPU Cholesky Decomposition},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100691812,
  author    = {Kazuki Tsuzuku and Toshio Endo},
  title     = {Power Capping of CPU-GPU Heterogeneous Systems Using Power and Performance Models},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100713191,
  author    = {辻田裕紀 and 遠藤敏夫},
  title     = {マルチノード・マルチGPU上のコレスキー分解に対するデータドリブン型アルゴリズム手法},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100704609,
  author    = {野村 哲弘 and 三浦 信一 and 遠藤 敏夫 and 松岡 聡},
  title     = {アプリケーションのEmpiricalな性能モデル構築のためのプロファイル情報の収集},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100713192,
  author    = {遠藤敏夫},
  title     = {異種プロセッサマシンのメモリ階層を活用するHHRT ライブラリの実装},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100691825,
  author    = {Naoto Sasaki and Kento Sato and Toshio Endo and Satoshi Matsuoka},
  title     = {Exploration of Lossy Compression for Application-level Checkpoint/Restart},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100691850,
  author    = {高嵜 祐樹 and 遠藤 敏夫 and 松岡 聡},
  title     = {GPUクラスタにおける大規模都市気流シミュレーションの最適化と性能モデル},
  booktitle = {},
  year      = 2015,
}

@inproceedings{CTT100687008,
  author    = {Toshio Endo},
  title     = {Harnessing Memory Hierarchy towards Extreme Fast and Big Simulations},
  booktitle = {Proceedings of 2015 Conference on Advanced Topics and Auto Tuning in High-Performance Scientific Computing},
  year      = 2015,
}

@inproceedings{CTT100687004,
  author    = {Toshio Endo and Akira Nukada and Satoshi Matsuoka},
  title     = {TSUBAME-KFC: a Modern Liquid Submersion Cooling Prototype towards Exascale Becoming the Greenest Supercomputer in the World},
  booktitle = {Proceedings of The 20th IEEE International Conference on Parallel and Distributed Systems (ICPADS 2014)},
  year      = 2014,
}

@inproceedings{CTT100687003,
  author    = {Guanghao Jin and James Lin and Toshio Endo},
  title     = {Efficient Utilization of Memory Hierarchy to Enable the Computation on Bigger Domains for Stencil Computation in CPU-GPU Based Systems},
  booktitle = {Proceedings of IEEE International Conference on High Performance Computing and Applications (ICHPCA-2014)},
  year      = 2014,
}

@inproceedings{CTT100687005,
  author    = {Toshio Endo and Guanghao Jin},
  title     = {Software Technologies Coping with Memory Hierarchy of GPGPU Clusters for Stencil Computations},
  booktitle = {Proceedings of IEEE Cluster Computing (CLUSTER2014)},
  year      = 2014,
}

@inproceedings{CTT100704633,
  author    = {野村哲弘 and 三浦信一 and 遠藤敏夫 and 松岡聡},
  title     = {実アプリケーションを用いた計算機評価ベンチマークと性能リポジトリの開発},
  booktitle = {情報処理学会研究報告},
  year      = 2014,
}

@inproceedings{CTT100687011,
  author    = {Guanghao Jin and Toshio Endo},
  title     = {Data Management and Loop Controlling to Surpass Memory Capacity of GPU in OpenACC Framework},
  booktitle = {},
  year      = 2014,
}

@inproceedings{CTT100687006,
  author    = {Hiroko Midorikawa and Hideyuki Tan and Toshio Endo},
  title     = {An Evaluation of the Potential of Flash SSD as Large and Slow Memory for Stencil Computations},
  booktitle = {Proceedings of The 2014 International Conference on High Performance Computing \& Simulation (HPCS 2014)},
  year      = 2014,
}

@inproceedings{CTT100691851,
  author    = {Toshio Endo},
  title     = {Experiences with the 5.7Pflop/s System TSUBAME2.5 at Tokyo Tech},
  booktitle = {},
  year      = 2014,
}

@inproceedings{CTT100683775,
  author    = {Akihiro Nomura and Shinichi Miura and Toshio Endo and Satoshi Matsuoka},
  title     = {Application Performance Characterization towards Exa-Scale Supercomputers},
  booktitle = {},
  year      = 2014,
}

@inproceedings{CTT100687007,
  author    = {Katsuki Fujisawa and Toshio Endo and Yuichiro Yasui and Hitoshi Sato and Naoki Matsuzawa and Satoshi Matsuoka and Hayato Waki},
  title     = {Peta-scale General Solver for Semidefinite Programming Problems with over Two Million Constraints},
  booktitle = {Proceedings of IEEE International Conference on Parallel and Distributed Processing Symposium 2014 (IPDPS2014)},
  year      = 2014,
}

@inproceedings{CTT100668404,
  author    = {松岡 聡 and 佐藤 賢斗 and 遠藤敏夫},
  title     = {エクサスケールスパコンに向けた耐故障性の評価 --- TSUBAME2.0を例にして ---},
  booktitle = {},
  year      = 2013,
}

@inproceedings{CTT100687000,
  author    = {Guanghao Jin and Toshio Endo and Satoshi Matsuoka},
  title     = {A Parallel Optimization Method for Stencil Computation on the Domain that is Bigger than Memory Capacity of GPUs},
  booktitle = {Proceedings of IEEE Cluster Computing (CLUSTER2013)},
  year      = 2013,
}

@inproceedings{CTT100668017,
  author    = {野村哲弘 and 三浦信一 and 遠藤敏夫 and 松岡聡 and 鈴木惣一朗 and 丸山直也},
  title     = {システム評価のためのアプリケーション性能リポジトリの構築と性能モデルの評価},
  booktitle = {情報処理学会 研究報告},
  year      = 2013,
}

@inproceedings{CTT100687001,
  author    = {Yukinori Sato and Hiroko Midorikawa and Toshio Endo},
  title     = {Identifying working data set of particular loop iterations for dynamic performance tuning},
  booktitle = {Proceedings of Workshop on Architectural and Microarchitectural Support for Binary Translation (AMAS-BT2013)},
  year      = 2013,
}

@inproceedings{CTT100687002,
  author    = {Guanghao Jin and Toshio Endo and Satoshi Matsuoka},
  title     = {A Multi-level Optimization Method for Stencil Computation on the Domain that is Bigger than Memory Capacity of GPU},
  booktitle = {Proceedings of The Third International Workshop on Accelerators and Hybrid Exascale Systems (AsHES)},
  year      = 2013,
}

@inproceedings{CTT100645960,
  author    = {金 光浩 and 遠藤 敏夫 and 松岡 聡},
  title     = {GPUメモリ容量を超える問題規模に対応する高性能ステンシル計算法},
  booktitle = {情報処理学会研究報告},
  year      = 2012,
}

@inproceedings{CTT100645961,
  author    = {野村 哲弘 and 遠藤 敏夫 and 松岡 聡},
  title     = {TSUBAME2.0におけるMulti-rail InfiniBandネットワークの性能評価},
  booktitle = {情報処理学会研究報告},
  year      = 2012,
}

@inproceedings{CTT100645944,
  author    = {Katsuki Fujisawa and Toshio Endo and Hitoshi Sato and Makoto Yamashita and Satoshi Matsuoka and Maho Nakata},
  title     = {High-Performance General Solver for Extremely Large-scale Semidefinite Programming Problems},
  booktitle = {Proceedings of IEEE/ACM International Conference for High Performance Computing, Networking, Storage and Analysis (SC12)},
  year      = 2012,
}

@inproceedings{CTT100632837,
  author    = {Shiqiao Du and Takuro Udagawa and Toshio Endo and Masakazu Sekijima},
  title     = {Molecular Dynamics Simulation of a Biomolecule with High Speed, Low Power and Accuracy Using GPU-Accelerated TSUBAME2.0 Supercomputer},
  booktitle = {Proceedings of Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC 2011)},
  year      = 2011,
}

@inproceedings{CTT100632836,
  author    = {Massimo Bernaschi and Mauro Bisson and Toshio Endo and Massimiliano Fatica and Satoshi Matsuoka and Simone Melchionna and Sauro Succi},
  title     = {Petaflop Biofluidics Simulations On A Two Million-Core System},
  booktitle = {Proceedings of IEEE/ACM International Conference for High Performance Computing, Networking, Storage and Analysis (SC11)},
  year      = 2011,
}
% Conference papers, 2011 down to 2008, one field per line.
% Ampersands in venue names are written as \& so the typeset bibliography
% does not hit LaTeX's alignment-tab error.
% NOTE(review): entries whose booktitle is empty have no venue recorded here;
% BibTeX reports them as an empty field until the venue is filled in.

@inproceedings{CTT100632835,
  author = {Takashi Shimokawabe and Takayuki Aoki and Tomohiro Takaki and Akinori Yamanaka and Akira Nukada and Toshio Endo and Naoya Maruyama and Satoshi Matsuoka},
  title = {Peta-scale Phase-Field Simulation for Dendritic Solidification on the TSUBAME 2.0 Supercomputer},
  booktitle = {Proceedings of IEEE/ACM International Conference for High Performance Computing, Networking, Storage and Analysis (SC11)},
  year = 2011,
}

@inproceedings{CTT100632833,
  author = {遠藤 敏夫 and 額田 彰 and 松岡 聡 and 長坂 真路 and 四津 匡康},
  title = {グリーンスパコンTSUBAME2.0における電力危機対応運用},
  booktitle = {情報処理学会研究報告},
  year = 2011,
}

@inproceedings{CTT100632838,
  author = {Irina Demeshko and Satoshi Matsuoka and Toshio Endo},
  title = {GPU-based approach for elastic-plastic deformation simulation},
  booktitle = {IPSJ SIG Technical Report},
  year = 2011,
}

@inproceedings{CTT100619970,
  author = {遠藤 敏夫 and 額田 彰 and 松岡 聡},
  title = {スーパーコンピュータTSUBAME 2.0 における Linpack 性能1 ペタフロップス超の達成},
  booktitle = {情報処理学会SACSIS2011論文集},
  year = 2011,
}

@inproceedings{CTT100620557,
  author = {Tatsuo Nomura and Naoya Maruyama and Toshio Endo and Satoshi Matsuoka},
  title = {A Sequential Programming Framework for Large-Scale GPU-Accelerated Structured Grids},
  booktitle = {},
  year = 2011,
}

@inproceedings{CTT100617857,
  author = {野村 達雄 and 丸山 直也 and 遠藤 敏夫 and 松岡 聡},
  title = {ステンシル計算を対象とした大規模GPUクラスタ向け自動並列化フレームワーク},
  booktitle = {},
  year = 2011,
}

@inproceedings{CTT100617846,
  author = {遠藤 敏夫 and 額田 彰 and 松岡 聡},
  title = {ヘテロ型スーパーコンピュータTSUBAME 2.0のLinpackによる性能評価},
  booktitle = {情報処理学会研究報告},
  year = 2010,
}

@inproceedings{CTT100617785,
  author = {島田 大地 and 遠藤 敏夫 and 丸山 直也 and 松岡 聡},
  title = {OpenCLを用いた異種GPUにおける性能特性に応じた最適化},
  booktitle = {情報処理学会研究報告},
  year = 2010,
}

@inproceedings{CTT100617842,
  author = {長坂 仁 and 丸山 直也 and 額田 彰 and 遠藤 敏夫 and 松岡 聡},
  title = {GPUにおけるモデルに基づいた電力効率の最適化},
  booktitle = {情報処理学会研究報告},
  year = 2010,
}

@inproceedings{CTT100617844,
  author = {野村 達雄 and 丸山 直也 and 遠藤 敏夫 and 松岡 聡},
  title = {ステンシル計算を対象とした大規模GPUクラスタ向け自動並列化フレームワーク},
  booktitle = {情報処理学会研究報告},
  year = 2010,
}

@inproceedings{CTT100617868,
  author = {Takashi Shimokawabe and Takayuki Aoki and Chiashi Muroi and Junichi Ishida and Kohei Kawano and Toshio Endo and Akira Nukada and Naoya Maruyama and Satoshi Matsuoka},
  title = {An 80-Fold Speedup, 15.0 TFlops, Full GPU Acceleration of Non-Hydrostatic Weather Model ASUCA Production Code},
  booktitle = {Proceedings of IEEE/ACM International Conference for High Performance Computing, Networking, Storage and Analysis (SC10)},
  year = 2010,
}

@inproceedings{CTT100618099,
  author = {Nguyen Toan and Tatsuo Nomura and Hideyuki Jitsumoto and Naoya Maruyama and Toshio Endo and Satoshi Matsuoka},
  title = {MPI-CUDA Application Checkpointing},
  booktitle = {GPU Technology Conference 2010},
  year = 2010,
}

@inproceedings{CTT100617853,
  author = {野村 達雄 and 丸山 直也 and 遠藤 敏夫 and 松岡 聡},
  title = {GPUクラスタを対象にした並列ステンシル計算の自動コード生成フレームワーク},
  booktitle = {情報処理学会研究報告},
  year = 2010,
}

@inproceedings{CTT100617861,
  author = {Nguyen Toan and Hideyuki Jitsumoto and Naoya Maruyama and Tatsuo Nomura and Toshio Endo and Satoshi Matsuoka},
  title = {MPI-CUDA Applications Checkpointing},
  booktitle = {IPSJ SIG Technical Report},
  year = 2010,
}

@inproceedings{CTT100617864,
  author = {Hitoshi Nagasaka and Naoya Maruyama and Akira Nukada and Toshio Endo and Satoshi Matsuoka},
  title = {Statistical Power Modeling of GPU Kernels Using Performance Counters},
  booktitle = {Proceedings of IEEE International Green Computing Conference (IGCC'10)},
  year = 2010,
}

@inproceedings{CTT100596776,
  author = {Toshio Endo and Akira Nukada and Satoshi Matsuoka and Naoya Maruyama},
  title = {Linpack Evaluation on a Supercomputer with Heterogeneous Accelerators},
  booktitle = {Proceedings of IEEE International Parallel \& Distributed Processing Symposium (IPDPS 2010)},
  year = 2010,
}

@inproceedings{CTT100600516,
  author = {浜野智明 and 額田彰 and 遠藤敏夫 and 松岡聡},
  title = {GPUクラスタにおける省電力タスクスケジューリング},
  booktitle = {情報処理学会研究報告2010-HPC-124},
  year = 2010,
}

@inproceedings{CTT100600603,
  author = {渡辺祐也 and 遠藤敏夫 and 松岡聡},
  title = {GPU クラスタにおける科学技術計算の自動最適化},
  booktitle = {情報処理学会研究報告},
  year = 2010,
}

@inproceedings{CTT100596824,
  author = {實本英之 and 中村俊介 and 遠藤敏夫 and 松岡聡},
  title = {増分データとErasure Coding を利用した高速なチェックポイント手法},
  booktitle = {情報処理学会研究報告},
  year = 2009,
}

@inproceedings{CTT100596826,
  author = {遠藤 敏夫 and 額田 彰 and 松岡 聡 and 丸山 直也},
  title = {異種アクセラレータを持つヘテロ型スーパーコンピュータ上のLinpack の性能向上手法},
  booktitle = {情報処理学会研究報告},
  year = 2009,
}

@inproceedings{CTT100596719,
  author = {長坂仁 and 丸山直也 and 額田 彰 and 遠藤 敏夫 and 松岡 聡},
  title = {GPU における性能と消費電力 の相関性の解析},
  booktitle = {情報処理学会研究報告2009-HPC-121},
  year = 2009,
}

@inproceedings{CTT100596794,
  author = {Satoshi Matsuoka and Takayuki Aoki and Toshio Endo and Akira Nukada and Toshihiro Kato and Atsushi Hasegawa},
  title = {GPU accelerated computing–from hype to mainstream, the rebirth of vector computing},
  booktitle = {Journal of Physics: Conference Series},
  year = 2009,
}

@inproceedings{CTT100596720,
  author = {島田大地 and 丸山直也 and 額田彰 and 遠藤 敏夫 and 松岡 聡},
  title = {GPUにおける耐故障性を考慮した数値計算の電力性能},
  booktitle = {情報処理学会研究報告2009-HPC-121},
  year = 2009,
}

@inproceedings{CTT100596815,
  author = {Toshio Endo},
  title = {Supercomputing on The TSUBAME GPU-Accelerated Cluster},
  booktitle = {},
  year = 2009,
}

@inproceedings{CTT100596795,
  author = {加藤季広 and 青木尊之 and 額田彰 and 遠藤敏夫 and 松岡聡 and 長谷川篤史},
  title = {姫野ベンチマークのGPUマルチノード実行における通信と演算のオーバーラップによる高速化 ~ 32GPUで700GFLOPS超を達成 ~},
  booktitle = {情報処理学会研究報告「ハイパフォーマンスコンピューティング(HPC)」},
  year = 2009,
}

@inproceedings{CTT100596748,
  author = {Hitoshi Sato and Satoshi Matsuoka and Toshio Endo},
  title = {File Clustering Based Replication Algorithm in a Grid Environment},
  booktitle = {Proceedings of the 2009 9th IEEE/ACM International Symposium on Cluster Computing and the Grid},
  year = 2009,
}

@inproceedings{CTT100596744,
  author = {島田大地 and 丸山直也 and 額田 彰 and 遠藤 敏夫 and 松岡 聡},
  title = {GPUにおける耐故障性を考慮した数値計算の電力性能},
  booktitle = {先進的計算シンポジウム (SACSIS2009)、ポスター発表},
  year = 2009,
}

@inproceedings{CTT100596743,
  author = {長坂仁 and 丸山直也 and 額田 彰 and 遠藤 敏夫 and 松岡 聡},
  title = {GPUにおける性能と消費電力の相関性の解析},
  booktitle = {先進的計算シンポジウム (SACSIS2009)、ポスター発表},
  year = 2009,
}

@inproceedings{CTT100596729,
  author = {Tomoaki Hamano and Toshio Endo and Satoshi Matsuoka},
  title = {Power-Aware Dynamic Task Scheduling for Heterogeneous Accelerated Clusters},
  booktitle = {2009 IEEE International Symposium on Parallel \& Distributed Processing},
  year = 2009,
}

@inproceedings{CTT100575653,
  author = {Hideyuki Jitsumoto and Toshio Endo and Satoshi Matsuoka},
  title = {Environmental-aware optimization of MPI checkpointing intervals},
  booktitle = {HPC ASIA 2009},
  year = 2009,
}

@inproceedings{CTT100575630,
  author = {遠藤敏夫 and 額田彰 and 松岡聡 and 丸山直也 and 實本英之},
  title = {四種プロセッサからなるヘテロ型スーパーコンピュータにおけるLinpackチューニング},
  booktitle = {計算機アーキテクチャ・ハイパフォーマンスコンピューティング合同研究発表会(HOKKE-2009)論文集},
  year = 2009,
}

@inproceedings{CTT100575631,
  author = {細萱祐人 and 遠藤敏夫 and 松岡聡},
  title = {スワップコストの動的推定によるメモリの省電力化手法},
  booktitle = {},
  year = 2009,
}

@inproceedings{CTT100575632,
  author = {山崎翔平 and 遠藤敏夫 and 松岡聡},
  title = {プロセス間共通メモリイメージを考慮したマイグレーション最適化},
  booktitle = {},
  year = 2009,
}

@inproceedings{CTT100575635,
  author = {遠藤敏夫 and 額田彰 and 松岡聡 and 丸山直也 and 實本英之},
  title = {四種プロセッサからなるヘテロ型スーパーコンピュータにおけるLinpackチューニング},
  booktitle = {ハイパフォーマンスコンピューティングと計算科学シンポジウム(HPCS2009)論文集},
  year = 2009,
}

@inproceedings{CTT100575636,
  author = {山崎翔平 and 遠藤敏夫 and 松岡聡},
  title = {プロセス間共通メモリイメージを考慮したマイグレーション最適化},
  booktitle = {},
  year = 2009,
}

@inproceedings{CTT100573993,
  author = {尾形泰彦 and 額田彰 and 丸山直也 and 遠藤敏夫 and 松岡聡},
  title = {複数 GPU システムに対応する自動最適化 3D-FFT ライブラリ},
  booktitle = {ハイパフォーマンスコンピューティングと計算科学シンポジウム(HPCS2009)論文集},
  year = 2009,
}

@inproceedings{CTT100575637,
  author = {細萱祐人 and 遠藤敏夫 and 松岡聡},
  title = {SWAPアクセス数の実行時推定によるメモリの省電力化手法},
  booktitle = {},
  year = 2009,
}

@inproceedings{CTT100596758,
  author = {滝澤 真一朗 and 遠藤敏夫 and 松岡聡},
  title = {光サーキットネットワークの補助的利用によるHPCアプリケーション性能向上},
  booktitle = {情報処理学会 ハイパフォーマンスコンピューティングと計算科学シンポジウム(HPCS2009)},
  year = 2009,
}

@inproceedings{CTT100575652,
  author = {Akira Nukada and Yasuhiko Ogata and Toshio Endo and Satoshi Matsuoka},
  title = {Bandwidth intensive 3-D FFT kernel for GPUs using CUDA},
  booktitle = {Proceedings of the 2008 ACM/IEEE conference on Supercomputing (SC08)},
  year = 2008,
}

@inproceedings{CTT100571813,
  author = {Satoshi Matsuoka and Yutaka Akiyama and Akira Nukada and Toshio Endo and Yasuhiko Ogata and Fumikazu Konishi},
  title = {HPC-GPGPU: Large-scale commodity accelerated clusters and its application to advanced structural proteomics},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100576078,
  author = {Hideyuki Jitsumoto and Toshio Endo and Satoshi Matsuoka},
  title = {Environmental-aware optimization of MPI checkpointing intervals},
  booktitle = {The 2008 IEEE International Conference on Cluster Computing (Cluster 2008)},
  year = 2008,
}

@inproceedings{CTT100576166,
  author = {Hitoshi Sato and Satoshi Matsuoka and Toshio Endo and Naoya Maruyama},
  title = {Access-pattern and bandwidth aware file replication algorithm in a grid environment},
  booktitle = {The 9th IEEE/ACM International Conference on Grid Computing (Grid 2008)},
  year = 2008,
}

@inproceedings{CTT100574002,
  author = {遠藤敏夫},
  title = {TSUBAMEにおけるアクセラレータの利用状況について},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575643,
  author = {遠藤敏夫},
  title = {アクセラレータを用いた大規模ヘテロ環境におけるLinpack},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575629,
  author = {滝澤 真一朗 and 遠藤敏夫 and 松岡聡},
  title = {光ネットワークの補助的利用によるHPC性能向上},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575626,
  author = {浜野智明 and 遠藤敏夫 and 松岡聡},
  title = {ヘテロ計算環境のための省電力タスクスケジューリング},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575627,
  author = {渡辺祐也 and 遠藤敏夫 and 松岡聡},
  title = {複数GPUにおけるセルフスケジューリングによる並列数値演算},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575628,
  author = {佐藤 仁 and 松岡聡 and 遠藤敏夫},
  title = {広域分散ファイルシステムにおけるアクセスパターンと性能を考慮したファイル配置},
  booktitle = {},
  year = 2008,
}
% Conference papers from 2008, one field per line.
% Ampersands in venue names are written as \& so the typeset bibliography
% does not hit LaTeX's alignment-tab error.
% NOTE(review): entries whose booktitle is empty have no venue recorded here;
% BibTeX reports them as an empty field until the venue is filled in.

@inproceedings{CTT100573982,
  author = {丸山直也 and 松岡聡 and 尾形泰彦 and 額田彰 and 遠藤敏夫},
  title = {ソフトウェアECCによるGPUメモリの耐故障性の実現と評価},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100573986,
  author = {千葉立寛 and 遠藤敏夫 and 松岡聡},
  title = {グリッド環境におけるMPI Scatter/Gather通信アルゴリズムの最適化},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575633,
  author = {浜野智明 and 遠藤敏夫 and 松岡聡},
  title = {ヘテロ計算環境のための省電力タスクスケジューリング},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575634,
  author = {渡辺裕也 and 遠藤敏夫 and 松岡聡},
  title = {不均一な複数GPUにおけるセルフスケジューリングによる並列数値演算},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100574006,
  author = {額田彰 and 尾形泰彦 and 遠藤敏夫 and 松岡聡},
  title = {CUDA 環境における高性能3次元FFT},
  booktitle = {情報処理学会 先進的計算基盤システムシンポジウム(SACSIS2008)},
  year = 2008,
}

@inproceedings{CTT100575648,
  author = {Yuto Hosogaya and Toshio Endo and Satoshi Matsuoka},
  title = {Performance evaluation of parallel applications on next generation memory architecture with power-aware paging method},
  booktitle = {The Fourth Workshop on High-Performance, Power-Aware Computing (HPPAC), in conjunction with IEEE IPDPS 2008},
  year = 2008,
}

@inproceedings{CTT100575651,
  author = {Toshio Endo and Satoshi Matsuoka},
  title = {Massive supercomputing coping with heterogeneity of modern accelerators},
  booktitle = {IEEE International Parallel \& Distributed Processing Symposium (IPDPS 2008)},
  year = 2008,
}

@inproceedings{CTT100575650,
  author = {Shin'ichiro Takizawa and Toshio Endo and Satoshi Matsuoka},
  title = {Locality aware MPI communication on a commodity opto-electronic hybrid network},
  booktitle = {Workshop on Large-Scale Parallel Processing (LSPP), in conjunction with IEEE IPDPS 2008},
  year = 2008,
}

@inproceedings{CTT100575649,
  author = {Yasuhiko Ogata and Toshio Endo and Naoya Maruyama and Satoshi Matsuoka},
  title = {An efficient, model-based CPU-GPU heterogeneous FFT library},
  booktitle = {International Heterogeneity in Computing Workshop (HCW '08), in conjunction with IEEE IPDPS 2008},
  year = 2008,
}
% Conference papers, 2008 down to 2006, followed by miscellaneous items
% (2017 down to 2009), one field per line.
% NOTE(review): entries whose booktitle is empty have no venue recorded here;
% BibTeX reports them as an empty field until the venue is filled in.

@inproceedings{CTT100575639,
  author = {滝澤 真一朗 and 遠藤敏夫 and 松岡聡},
  title = {情報爆発時代の光インターコネクト上でのMPI通信アルゴリズム},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575642,
  author = {遠藤敏夫 and 松岡聡},
  title = {情報爆発時代へ向けた不均一アーキテクチャにおけるスーパーコンピューティング},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575641,
  author = {佐藤 仁 and 松岡聡 and 遠藤敏夫},
  title = {情報爆発時代のグリッドファイルシステム上での大規模データ管理},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575640,
  author = {實本英之 and 遠藤敏夫 and 松岡聡},
  title = {情報爆発に対応する耐故障性 MPI フレームワークの提案},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575638,
  author = {千葉立寛 and 遠藤敏夫 and 松岡聡},
  title = {情報爆発時代のグリッド環境に対応したMPI集団通信アルゴリズムの最適化},
  booktitle = {},
  year = 2008,
}

@inproceedings{CTT100575645,
  author = {細萱祐人 and 遠藤敏夫 and 松岡聡},
  title = {省電力ページング方式を実装した次世代メモリアーキテクチャ上での並列プログラムの評価},
  booktitle = {情報処理学会 ハイパフォーマンスコンピューティングと計算科学シンポジウム(HPCS2008)},
  year = 2008,
}

@inproceedings{CTT100574004,
  author = {尾形泰彦 and 遠藤敏夫 and 丸山直也 and 松岡聡},
  title = {性能モデルに基づくCPU及びGPUを併用する効率的なFFTライブラリ},
  booktitle = {情報処理学会 ハイパフォーマンスコンピューティングと計算科学シンポジウム(HPCS2008)},
  year = 2008,
}

@inproceedings{CTT100575609,
  author = {滝澤 真一朗 and 遠藤敏夫 and 松岡聡},
  title = {次世代光インターコネクトでの MPI 通信性能の評価},
  booktitle = {},
  year = 2007,
}

@inproceedings{CTT100576165,
  author = {佐藤 仁 and 松岡聡 and 遠藤敏夫},
  title = {広域分散環境における大規模データ管理のためのノードグルーピング},
  booktitle = {},
  year = 2007,
}

@inproceedings{CTT100575608,
  author = {滝澤 真一朗 and 遠藤敏夫 and 松岡聡},
  title = {次世代光インターコネクト上での MPI アプリケーションの評価},
  booktitle = {},
  year = 2007,
}

@inproceedings{CTT100574437,
  author = {尾形泰彦 and 遠藤敏夫 and 松岡聡},
  title = {CPUおよびGPUを併用するFFTライブラリの提案と評価},
  booktitle = {},
  year = 2007,
}

@inproceedings{CTT100576027,
  author = {細萱祐人 and 遠藤敏夫 and 松岡聡},
  title = {次世代省電力メモリを用いた並列プログラムの省電力化の評価},
  booktitle = {},
  year = 2007,
}

@inproceedings{CTT100576069,
  author = {Tatsuhiro Chiba and Toshio Endo and Satoshi Matsuoka},
  title = {High-performance MPI broadcast algorithm for grid environments utilizing multi-lane NICs},
  booktitle = {Proceedings of the Seventh IEEE International Symposium on Cluster Computing and the Grid (CCGrid'07)},
  year = 2007,
}

@inproceedings{CTT100576033,
  author = {實本英之 and 遠藤敏夫 and 松岡聡},
  title = {フォールト/リカバリモデルを考慮した耐故障性をもつMPI フレームワークABARIS の提案と評価},
  booktitle = {},
  year = 2007,
}

@inproceedings{CTT100575647,
  author = {Hideyuki Jitsumoto and Toshio Endo and Satoshi Matsuoka},
  title = {ABARIS: An adaptable fault detection/recovery component framework for MPIs},
  booktitle = {12th IEEE Workshop on Dependable Parallel, Distributed and Network-Centric Systems (DPDNS07), in conjunction with IPDPS2007},
  year = 2007,
}

@inproceedings{CTT100576049,
  author = {遠藤敏夫 and 松岡聡 and 橋爪信明 and 長坂真路},
  title = {ヘテロ型スーパーコンピュータTSUBAMEのLinpackによる性能評価},
  booktitle = {2007年ハイパフォーマンスコンピューティングと計算科学シンポジウムHPCS2007論文集},
  year = 2007,
}

@inproceedings{CTT100576050,
  author = {千葉立寛 and 遠藤敏夫 and 松岡聡},
  title = {グリッド環境におけるマルチレーンを用いたMPIコレクティブ通信アルゴリズム},
  booktitle = {情報処理学会 ハイパフォーマンスコンピューティングと計算科学シンポジウム(HPCS2007)},
  year = 2007,
}

@inproceedings{CTT100576038,
  author = {合田憲人 and 大澤清 and 大角知孝 and 笠井武史 and 小野功 and 實本英之 and 松岡聡 and 斎藤秀雄 and 遠藤敏夫 and 横山大作 and 田浦健次朗 and 近山隆 and 田中良夫 and 下坂久司 and 梶原広輝 and 廣安知之 and 藤澤克樹},
  title = {グリッドチャレンジテストベッドの構築と運用〜グリチャレテストベッドの作り方〜},
  booktitle = {情報処理学会研究報告 2006-HPC-107},
  year = 2006,
}

@inproceedings{CTT100576040,
  author = {遠藤敏夫 and 松岡聡 and 橋爪信明 and 長坂真路 and 後藤和茂},
  title = {ヘテロ型スーパーコンピュータTSUBAMEのLinpackによる性能評価},
  booktitle = {情報処理学会研究報告 2006-HPC-107},
  year = 2006,
}

@misc{CTT100756798,
  author = {Satoshi Matsuoka and Toshio Endo and Akira Nukada and Shinichi Miura and Akihiro Nomura and Hitoshi Sato and Hideyuki Jitsumoto and Aleksandr Drozd},
  title = {Overview of TSUBAME3.0, Green Cloud Supercomputer for Convergence of HPC, AI and Big-Data},
  year = 2017,
}

@misc{CTT100687009,
  author = {遠藤敏夫 and 額田彰 and 松岡聡},
  title = {超省エネスーパーコンピュータTSUBAME},
  year = 2014,
}

@misc{CTT100687010,
  author = {遠藤敏夫 and 額田彰 and 松岡聡},
  title = {TSUBAME-KFC: 液浸冷却を用いた世界一省エネなスーパーコンピュータ},
  year = 2014,
}

@misc{CTT100721909,
  author = {渡辺 治 and 遠藤 敏夫},
  title = {スーパーコンピューティングコンテスト・2013},
  year = 2014,
}

@misc{CTT100686999,
  author = {藤澤克樹 and 遠藤敏夫},
  title = {大規模半正定値計画問題に対する内点法アルゴリズムの高速計算},
  year = 2012,
}

@misc{CTT100632834,
  author = {遠藤敏夫},
  title = {ペタスケールグリーンスパコンTSUBAME2.0},
  year = 2011,
}

@misc{CTT100617877,
  author = {松岡聡 and 遠藤敏夫 and 丸山直也 and 佐藤仁 and 滝澤真一朗},
  title = {TSUBAME2.0の全貌},
  year = 2010,
}

@misc{CTT100617875,
  author = {松岡聡 and 青木尊之 and 遠藤敏夫 and 丸山直也 and 佐藤仁 and 滝澤真一朗 and 實本英之},
  title = {TSUBAMEの造り方から探る PCクラスターと「スパコン」のあいだ},
  year = 2010,
}

@misc{CTT100573980,
  author = {遠藤敏夫},
  title = {東京工業大学TSUBAMEにおけるアクセラレータ活用事例},
  year = 2009,
}