@book{CTT100686327, author = {Mustafa AbdulJabbar and Rio Yokota}, title = {N-body methods}, publisher = {Morgan Kaufmann}, year = 2014, } @book{CTT100686328, author = {Rio Yokota and Lorena Barba}, title = {Treecode and fast multipole method for N-body simulation with CUDA}, publisher = {Morgan Kaufmann}, year = 2011, } @article{CTT100922800, author = {戸井田 一聖 and 西口 浩司 and 千葉 直也 and 和田 有司 and 横田 理央 and 干場 大也 and 加藤 準治}, title = {構造力学を考慮した3次元形状深層生成モデルの提案}, journal = {日本計算工学会論文集}, year = 2024, } @article{CTT100905175, author = {Hiroki Naganuma and Kartik Ahuja and Shiro Takagi and Tetsuya Motokawa and Rio Yokota and Kohta Ishikawa and Ikuro Sato and Ioannis Mitliagkas}, title = {Empirical Study on Optimizer Selection for Out-of-Distribution Generalization}, journal = {Transactions on Machine Learning Research}, year = 2023, } @article{CTT100872027, author = {Muhammad Ridwan Apriansyah and Rio Yokota}, title = {Parallel QR Factorization of Block Low-Rank Matrices}, journal = {ACM Transactions on Mathematical Software}, year = 2022, } @article{CTT100867097, author = {Hiroyuki Ootomo and Rio Yokota}, title = {Recovering single precision accuracy from Tensor Cores while surpassing the FP32 theoretical peak performance}, journal = {The International Journal of High Performance Computing Applications}, year = 2022, } @article{CTT100862742, author = {Tingyu Wang and Rio Yokota and Lorena A. Barba}, title = {ExaFMM: a high-performance fast multipole method library with C++ and Python interfaces}, journal = {The Journal of Open Source Software}, year = 2021, } @article{CTT100832475, author = {Davoud S. 
Shamshirgar and Rio Yokota and Anna-Karin Tornberg and Berk Hess}, title = {Regularizing the Fast Multipole Method for use in Molecular Simulation}, journal = {Journal of Chemical Physics}, year = 2020, } @article{CTT100832594, author = {Kazuki Osawa and Yohei Tsuji and Yuichiro Ueno and Akira Naruse and Chuan-Sheng Foo and Rio Yokota}, title = {Scalable and Practical Natural Gradient for Large-Scale Deep Learning}, journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence}, year = 2020, } @article{CTT100815367, author = {横田理央}, title = {巨大行列とAI}, journal = {数学セミナー}, year = 2020, } @article{CTT100815366, author = {横田理央}, title = {スーパーコンピューティングコンテスト2019}, journal = {数学セミナー}, year = 2020, } @article{CTT100811319, author = {Akihiro Ida and Hiroshi Nakashima and Tasuku Hiraishi and Ichitaro Yamazaki and Rio Yokota and Takeshi Iwashita}, title = {QR Factorization of Block Low-rank Matrices with Weak Admissibility Condition}, journal = {Journal of Information Processing}, year = 2019, } @article{CTT100807737, author = {Ichitaro Yamazaki and Akihiro Ida and Rio Yokota and Jack Dongarra}, title = {Distributed Memory Lattice H-matrix Factorization}, journal = {The International Journal of High Performance Computing Applications}, year = 2019, } @article{CTT100815304, author = {Mustafa AbdulJabbar and Mohammed Al Farhan and Noha Al-Harthi and Rui Chen and Rio Yokota and Hakan Bagci and David Keyes}, title = {Extreme Scale FMM-Accelerated Boundary Integral Equation Solver for Wave Scattering}, journal = {SIAM Journal on Scientific Computing}, year = 2019, } @article{CTT100781338, author = {Naoya Maruyama and Takayuki Aoki and Kenjiro Taura and Rio Yokota and Mohamed Wahib and Motohiko Matsuda and Keisuke Fukuda and Takashi Shimokawabe and Naoyuki Onodera and Michel Müller and Shintaro Iwasaki}, title = {Highly Productive, High-Performance Application Frameworks for Post-Petascale Computing}, journal = {Advanced Software Technologies for Post-Peta Scale 
Computing}, year = 2018, } @article{CTT100760854, author = {Huda Ibeid and Rio Yokota and Jennifer Pestana and David Keyes}, title = {Fast Multipole Preconditioners for Sparse Matrices Arising from Elliptic Equations}, journal = {Computing and Visualization in Science}, year = 2017, } @article{CTT100734509, author = {横田理央}, title = {FMM と H^2(HSS) 行列のトレードオフについて}, journal = {計算工学}, year = 2016, } @article{CTT100734510, author = {横田理央}, title = {大規模境界要素法解析における分散並列 FMM の通信最適化}, journal = {シミュレーション}, year = 2016, } @article{CTT100718789, author = {Huda Ibeid and Rio Yokota and David Keyes}, title = {A performance model for the communication in fast multipole methods on high-performance computing platforms}, journal = {International Journal of High Performance Computing Applications}, year = 2016, } @article{CTT100791168, author = {Abdelhalim Amer and Satoshi Matsuoka and Miquel Pericàs and Naoya Maruyama and Kenjiro Taura and Rio Yokota and Pavan Balaji}, title = {Scaling FMM with data-driven OpenMP tasks on multicore architectures}, journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)}, year = 2016, } @article{CTT100718790, author = {Julio Castrillon-Candas and Marc Genton and Rio Yokota}, title = {Multi-level restricted maximum likelihood covariance estimation and kriging for large non-gridded spatial datasets}, journal = {Spatial Statistics}, year = 2015, } @article{CTT100686122, author = {Rio Yokota and George Turkiyyah and David E. 
Keyes}, title = {Communication complexity of the fast multipole method and its algebraic variants}, journal = {Supercomputing Frontiers and Innovations}, year = 2014, } @article{CTT100686123, author = {Yousuke Ohno and Rio Yokota and Hiroshi Koyama and Gentaro Morimoto and Aki Hasegawa and Gen Masumoto and Noriaki Okimoto and Yoshinori Hirano and Huda Ibeid and Tetsu Narumi and Makoto Taiji}, title = {Petascale molecular dynamics simulation using the fast multipole method on K computer}, journal = {Computer Physics Communications}, year = 2014, } @article{CTT100686124, author = {Hatem Ltaief and Rio Yokota}, title = {Data-driven execution of fast multipole methods}, journal = {Concurrency and Computation: Practice and Experience}, year = 2013, } @article{CTT100686125, author = {Rio Yokota}, title = {An FMM based on dual tree traversal for many-core architectures}, journal = {Journal of Algorithms and Computational Technology}, year = 2013, } @article{CTT100686126, author = {Rio Yokota and Lorena Barba and Tetsu Narumi and Kenji Yasuoka}, title = {Petascale turbulence simulation using a highly parallel fast multipole method}, journal = {Computer Physics Communications}, year = 2012, } @article{CTT100686127, author = {Rio Yokota and Lorena Barba}, title = {FMM-based vortex method for simulation of isotropic turbulence on GPUs, compared with a spectral method}, journal = {Computers and Fluids}, year = 2012, } @article{CTT100686129, author = {Rio Yokota and Lorena Barba}, title = {Hierarchical N-body simulations with auto-tuning for heterogeneous systems}, journal = {Computing in Science and Engineering}, year = 2012, } @article{CTT100686128, author = {Rio Yokota and Lorena Barba}, title = {A Tuned and scalable fast multipole method as a preeminent algorithm for exascale systems}, journal = {International Journal of High Performance Computing Applications}, year = 2012, } @article{CTT100686130, author = {Jaydeep Bardhan and R. 
Yokota and Matthew Knepley and Lorena Barba and Tsuyoshi Hamada}, title = {Biomolecular electrostatics using a fast multipole BEM on up to 512 GPUs and a billion unknowns}, journal = {Computer Physics Communications}, year = 2011, } @article{CTT100686325, author = {Rio Yokota and Shinnosuke Obi}, title = {Vortex methods for the simulation of turbulent flows}, journal = {Journal of Fluid Science and Technology}, year = 2011, } @article{CTT100686131, author = {Rio Yokota and Lorena Barba}, title = {Comparing the treecode with FMM on GPUs for vortex particle simulations of a leapfrogging vortex ring}, journal = {Computers and Fluids}, year = 2010, } @article{CTT100686135, author = {Rio Yokota and Lorena Barba and Matthew Knepley}, title = {PetRBF–A parallel O(N) algorithm for radial basis function interpolation with Gaussians}, journal = {Computer Methods in Applied Mechanics and Engineering}, year = 2010, } @article{CTT100686134, author = {Rio Yokota and Shinnosuke Obi}, title = {Comparing vortex methods and finite difference methods in a homogeneous turbulent shear flow}, journal = {International Journal for Numerical Methods in Fluids}, year = 2009, } @article{CTT100686136, author = {Rio Yokota and Tetsu Narumi and Ryuji Sakamaki and Shun Kameoka and Shinnosuke Obi and Kenji Yasuoka}, title = {Fast multipole methods on a cluster of GPUs for the meshless simulation of turbulence}, journal = {Computer Physics Communications}, year = 2009, } @article{CTT100686137, author = {Rio Yokota and Tarun Kumar Sheel and Shinnosuke Obi}, title = {Calculation of isotropic turbulence using a pure Lagrangian vortex method}, journal = {Journal of Computational Physics}, year = 2007, } @inproceedings{CTT100922690, author = {藤井 一喜 and 中村 泰士 and Mengsay Loem and 飯田 大貴 and 大井 聖也 and 服部 翔 and 平井 翔太 and 水木 栄 and 横田 理央 and 岡崎 直観}, title = {継続事前学習による日本語に強い大規模言語モデルの構築}, booktitle = {}, year = 2024, } @inproceedings{CTT100922687, author = {水木 栄 and 飯田 大貴 and 藤井 一喜 and 中村 泰士 and Mengsay Loem 
and 大井 聖也 and 服部 翔 and 平井 翔太 and 横田 理央 and 岡崎 直観}, title = {大規模言語モデルの日本語能力の効率的な強化: 継続事前学習における語彙拡張と対訳コーパスの活用}, booktitle = {}, year = 2024, } @inproceedings{CTT100922686, author = {岡崎 直観 and 服部 翔 and 平井 翔太 and 飯田 大貴 and 大井 聖也 and 藤井 一喜 and 中村 泰士 and Mengsay Loem and 横田 理央 and 水木 栄}, title = {Swallowコーパス: 日本語大規模ウェブコーパス}, booktitle = {}, year = 2024, } @inproceedings{CTT100906352, author = {Tomoya Takahashi and Shingo Yashima and Kohta Ishikawa and Ikuro Sato and Rio Yokota}, title = {Pixel-level Contrastive Learning of Driving Videos with Optical Flow}, booktitle = {Proc. CVPR workshop 2023}, year = 2023, } @inproceedings{CTT100921055, author = {浅倉 拓也 and 井上中順 and 横田 理央 and 篠田 浩一}, title = {受容野の自動最適化によるモードに適応的なTransformerの開発}, booktitle = {人工知能学会全国大会 (第37回)論文集}, year = 2023, } @inproceedings{CTT100890866, author = {Aoyu Li and Ikuro Sato and Kohta Ishikawa and Rei Kawakami and Rio Yokota}, title = {Informative Sample-Aware Proxy for Deep Metric Learning}, booktitle = {}, year = 2022, } @inproceedings{CTT100895747, author = {RYU TADOKORO and Kataoka Hirokatsu and 川上 玲 and 横田 理央 and 井上 中順}, title = {蒸留画像による事前学習効果についての検討}, booktitle = {講演論文集}, year = 2022, } @inproceedings{CTT100874414, author = {Qianxiang Ma and Sameer Deshmukh and Rio Yokota}, title = {Scalable Linear Time Dense Direct Solver for 3-D Problems Without Trailing Sub-Matrix Dependencies}, booktitle = {}, year = 2022, } @inproceedings{CTT100890864, author = {Hiroki Naganuma and Kartik Ahuja and Ioannis Mitliagkas and Shiro Takagi and Tetsuya Motokawa and Rio Yokota and Kohta Ishikawa and Ikuro Sato}, title = {Empirical Study on Optimizer Selection for Out-of-Distribution Generalization}, booktitle = {Proc. 
NeurIPS 2022}, year = 2022, } @inproceedings{CTT100882020, author = {伊田 明弘 and 荻田 武史 and 横田 理央}, title = {対称ブロック低ランク行列の精度保証付き固有値問題解法}, booktitle = {}, year = 2022, } @inproceedings{CTT100881749, author = {Rio Yokota}, title = {Matrices in Deep Neural Networks and How to Compute Them in Parallel}, booktitle = {}, year = 2022, } @inproceedings{CTT100890860, author = {高橋那弥 and 八嶋晋吾 and 石川康太 and 佐藤育郎 and 横田理央}, title = {走行動画の大規模自己教師あり学習の検討と計画}, booktitle = {MIRUブックレット}, year = 2022, } @inproceedings{CTT100890854, author = {Aoyu Li and Ikuro Sato and 石川康太 and Rei Kawakami and Rio Yokota}, title = {Informative Sample-Aware Proxy for Deep Metric Learning}, booktitle = {MIRUブックレット}, year = 2022, } @inproceedings{CTT100866763, author = {Hirokatsu Kataoka and Ryo Hayamizu and Ryosuke Yamada and Kodai Nakashima and Sora Takashima and Xinyu Zhang and Edgar Josafat Martinez-Noriega and Nakamasa Inoue and Rio Yokota}, title = {Replacing Labeled Real-image Datasets with Auto-generated Contours}, booktitle = {}, year = 2022, } @inproceedings{CTT100865536, author = {Hana Hoshino and Kei Ota and Asako Kanezaki and Rio Yokota}, title = {OPIRL: Sample Efficient Off-Policy Inverse Reinforcement Learning via Distribution Matching}, booktitle = {}, year = 2022, } @inproceedings{CTT100869127, author = {Thomas Spendlhofer and Rio Yokota}, title = {Iterative Refinement with Hierarchical Low-rank Preconditioners Using Mixed Precision}, booktitle = {}, year = 2022, } @inproceedings{CTT100869126, author = {Muhammad Ridwan Apriansyah and Rio Yokota}, title = {Parallel QR Factorization of Block Low-rank Matrices}, booktitle = {}, year = 2022, } @inproceedings{CTT100869125, author = {Sameer Satish Deshmukh and Rio Yokota}, title = {Acceleration of O(N) Solvers for Large Dense Matrices}, booktitle = {}, year = 2022, } @inproceedings{CTT100866867, author = {中村秋海 and 横田理央}, title = {Vision Transformerにおけるバッチサイズの汎化性能への影響}, booktitle = {}, year = 2022, } 
@inproceedings{CTT100866866, author = {石井央 and 横田理央}, title = {深層学習における2次最適化の汎化性能の検証}, booktitle = {}, year = 2022, } @inproceedings{CTT100860388, author = {Shun Iwase and Xingyu Liu and Rawal Khirodkar and Rio Yokota and Kris M. Kitani}, title = {RePOSE: Real-Time Iterative Rendering and Refinement for 6D Object Pose Estimation}, booktitle = {}, year = 2021, } @inproceedings{CTT100862737, author = {Rio Yokota}, title = {Approximations of Natural Gradient Descent in Distributed Training}, booktitle = {}, year = 2021, } @inproceedings{CTT100862738, author = {横田 理央}, title = {二次最適化を用いた分散並列深層学習}, booktitle = {}, year = 2021, } @inproceedings{CTT100862739, author = {横田 理央}, title = {階層的低ランク近似法に関するレビュー}, booktitle = {}, year = 2021, } @inproceedings{CTT100854272, author = {Yuichiro Ueno and Kazuki Osawa and Yohei Tsuji and Akira Naruse and Rio Yokota}, title = {Rich Information is Affordable: A Systematic Performance Analysis of Second-order Optimization Using K-FAC}, booktitle = {}, year = 2021, } @inproceedings{CTT100862736, author = {Hikaru Nakata and Nakamasa Inoue and Rio Yokota}, title = {Self-supervised Continual Pretraining for Class Incremental Image Classification}, booktitle = {Proc. 
CVPR CLVISION Workshop (Findings)}, year = 2021, } @inproceedings{CTT100862740, author = {横田 理央}, title = {スパコンを用いた大規模並列分散深層学習}, booktitle = {}, year = 2021, } @inproceedings{CTT100862741, author = {横田 理央}, title = {深層学習におけるヘッセ行列,フィッシャー行列,共分散行列の高速近似解法}, booktitle = {}, year = 2020, } @inproceedings{CTT100835680, author = {Rio Yokota}, title = {Degree of Approximation and Overhead of Computing Curvature}, booktitle = {}, year = 2020, } @inproceedings{CTT100832593, author = {Hiroyuki Ootomo and Rio Yokota}, title = {Randomized SVD on TensorCores}, booktitle = {}, year = 2020, } @inproceedings{CTT100832592, author = {Sameer Deshmukh and Rio Yokota}, title = {Distributed Memory Task-Based Block Low Rank Direct Solver}, booktitle = {}, year = 2020, } @inproceedings{CTT100835684, author = {中田 光 and 横田 理央}, title = {画像分類のための継続的な事前学習における教師なし表現学習の堅牢性に関する検証}, booktitle = {}, year = 2020, } @inproceedings{CTT100835682, author = {Rio Yokota and Yohei Tsuji and Kazuki Osawa}, title = {Second Order Optimization for Distributed Data-parallel Deep Learning on 4000 GPUs}, booktitle = {}, year = 2020, } @inproceedings{CTT100835685, author = {大友広幸 and 横田理央}, title = {TensorコアのAPIの構造解析を用いた拡張ライブラリの開発}, booktitle = {}, year = 2020, } @inproceedings{CTT100835686, author = {所畑貴大 and 長沼大樹 and 横田理央}, title = {確率的重み付け平均法のラージバッチ学習における有用性の検証}, booktitle = {}, year = 2020, } @inproceedings{CTT100835687, author = {横田理央}, title = {二次最適化を用いた巨大な言語モデルの学習およびFRNNを用いたプラズマ挙動予測}, booktitle = {}, year = 2020, } @inproceedings{CTT100832477, author = {Rise Ooi and Takeshi Iwashita and Takeshi Fukaya and Akihiro Ida and Rio Yokota}, title = {Effect of Mixed Precision Computing on H-Matrix Vector Multiplication in BEM Analysis}, booktitle = {Proceedings of HPC Asia 2020}, year = 2020, } @inproceedings{CTT100821422, author = {Muhammad Ridwan Apriansyah and Rio Yokota}, title = {QR Decomposition of Block Low-Rank Matrices}, booktitle = {}, year = 2020, } @inproceedings{CTT100821421, author = {Sameer Deshmukh 
and Rio Yokota}, title = {Distributed Memory Task-Based Block Low Rank Direct Solver}, booktitle = {}, year = 2020, } @inproceedings{CTT100803976, author = {Kazuki Osawa and Siddharth Swaroop and Anirudh Jain and Runa Eschenhagen and Richard E. Turner and Rio Yokota and Mohammad Emtiyaz Khan}, title = {Practical Deep Learning with Bayesian Principles}, booktitle = {}, year = 2019, } @inproceedings{CTT100821423, author = {Hiroyuki Ootomo and Rio Yokota}, title = {TSQR on TensorCores}, booktitle = {}, year = 2019, } @inproceedings{CTT100821426, author = {Hiroki Naganuma and Rio Yokota}, title = {On Empirical Analysis of Layer-wised Learning Rate Schedule}, booktitle = {}, year = 2019, } @inproceedings{CTT100821424, author = {Qianxiang Ma and Rio Yokota}, title = {Runtime System for GPU-based Hierarchical LU factorization}, booktitle = {}, year = 2019, } @inproceedings{CTT100819712, author = {八島慶汰 and 石川康太 and 佐藤育郎 and 野村哲弘 and 横田理央 and 松岡聡}, title = {早期終了タイミングを予測する:深層学習における確率勾配の分布の変化点検出}, booktitle = {}, year = 2019, } @inproceedings{CTT100807736, author = {Satoshi Ohshima and Ichitaro Yamazaki and Akihiro Ida and Rio Yokota}, title = {Optimization of Numerous Small Dense-Matrix–Vector Multiplications in H-matrix Arithmetic on GPU}, booktitle = {}, year = 2019, } @inproceedings{CTT100821425, author = {大友 広幸 and 横田 理央}, title = {Tensorコアを用いたTSQR}, booktitle = {}, year = 2019, } @inproceedings{CTT100815305, author = {Yohei Tsuji and Kazuki Osawa and Yuichiro Ueno and Akira Naruse and Rio Yokota and Satoshi Matsuoka}, title = {Performance Optimizations and Analysis of Distributed Deep Learning with Approximated Second-Order Optimization Method}, booktitle = {Proceedings of the 48th International Conference on Parallel Processing: Workshops}, year = 2019, } @inproceedings{CTT100802443, author = {Peter Spalthoff and 横田 理央}, title = {Flexible and Simplistic Hierarchical Matrix-Based Fast Direct Solver}, booktitle = {}, year = 2019, } @inproceedings{CTT100802444, author = {大友 
広幸 and 横田 理央}, title = {Tensorコアを用いたTSQRのGPU実装}, booktitle = {}, year = 2019, } @inproceedings{CTT100793663, author = {Kazuki Osawa and Yohei Tsuji and Yuichiro Ueno and Akira Naruse and Rio Yokota and Satoshi Matsuoka}, title = {Second-order Optimization Method for Large Mini-batch: Training ResNet-50 on ImageNet in 35 Epochs}, booktitle = {}, year = 2019, } @inproceedings{CTT100793662, author = {長沼 大樹 and 横田 理央}, title = {ラージバッチ学習のための自然勾配学習法におけるSmoothingの有効性}, booktitle = {}, year = 2019, } @inproceedings{CTT100835681, author = {Rio Yokota}, title = {Recent Trends in Hierarchical Low-Rank Approximation Methods}, booktitle = {}, year = 2019, } @inproceedings{CTT100793660, author = {Yuichiro Ueno and Rio Yokota}, title = {Exhaustive Study of Hierarchical AllReduce Patterns for Large Messages Between GPUs}, booktitle = {}, year = 2019, } @inproceedings{CTT100793661, author = {Hiroki Naganuma and Rio Yokota}, title = {A Performance Improvement Approach for Second-Order Optimization in Large Mini-batch Training}, booktitle = {}, year = 2019, } @inproceedings{CTT100793658, author = {横田理央 and 大沢和樹 and 辻陽平 and 上野裕一郎 and 成瀬彰}, title = {大規模並列深層学習における2次の最適化手法の効果}, booktitle = {}, year = 2019, } @inproceedings{CTT100793659, author = {長沼 大樹 and 横田 理央}, title = {ノイズ注入による平均化を用いたラージバッチ学習の汎化性能改善手法の検討}, booktitle = {}, year = 2019, } @inproceedings{CTT100793657, author = {大沢和樹 and 横田理央 and Chuan-Sheng Foo and Vijay Chandrasekhar}, title = {Fisher情報行列の解析に基づく大規模深層学習のための二次最適化手法}, booktitle = {}, year = 2019, } @inproceedings{CTT100793655, author = {中田光 and 大沢和樹 and 横田理央}, title = {自然勾配法に基づく変分深層学習}, booktitle = {}, year = 2019, } @inproceedings{CTT100793654, author = {大友広幸 and 横田理央}, title = {Tensorコアを用いたBatched QR分解}, booktitle = {}, year = 2019, } @inproceedings{CTT100793653, author = {長沼大樹 and 横田理央}, title = {大規模並列深層学習のための目的関数の平滑化}, booktitle = {}, year = 2019, } @inproceedings{CTT100835683, author = {Rio Yokota}, title = {Kronecker Factorization for Second Order Optimization in 
Deep Learning}, booktitle = {}, year = 2019, } @inproceedings{CTT100773722, author = {Rio Yokota}, title = {Optimization Methods for Large Scale Distributed Deep Learning}, booktitle = {}, year = 2018, } @inproceedings{CTT100771718, author = {長沼大樹 and 岩瀬 駿 and 郭 林昇 and 中田 光 and 横田 理央}, title = {自然勾配近似法を用いた大規模並列深層学習におけるハイパーパラメータ最適化}, booktitle = {}, year = 2018, } @inproceedings{CTT100773723, author = {Rio Yokota}, title = {Early Application Results on TSUBAME 3}, booktitle = {}, year = 2018, } @inproceedings{CTT100773724, author = {Rio Yokota}, title = {Scaling Deep Learning to Thousands of GPUs}, booktitle = {}, year = 2018, } @inproceedings{CTT100773725, author = {Rio Yokota}, title = {Energy Conserving Fast Multipole Methods for the Calculation of Long-range Interactions}, booktitle = {}, year = 2018, } @inproceedings{CTT100759345, author = {Ichitaro Yamazaki and Ahmad Abdelfattah and Akihiro Ida and Satoshi Ohshima and Stanimire Tomov and Rio Yokota and Jack Dongarra}, title = {Analyzing Performance of BiCGStab with Hierarchical Matrix on GPU clusters}, booktitle = {}, year = 2018, } @inproceedings{CTT100773726, author = {Rio Yokota}, title = {Can we use Hierarchical Low-Rank Approximation for Deep Learning?}, booktitle = {}, year = 2018, } @inproceedings{CTT100759344, author = {大友広幸 and 大沢和樹 and 横田理央}, title = {フィッシャー情報行列のクロネッカー因子分解を用いた深層学習}, booktitle = {}, year = 2018, } @inproceedings{CTT100760853, author = {大友 広幸 and 大沢 和樹 and 横田 理央}, title = {フィッシャー情報行列のクロネッカー因子分解を用いた深層ニューラルネットワークの分散学習}, booktitle = {}, year = 2018, } @inproceedings{CTT100759346, author = {Satoshi Ohshima and Ichitaro Yamazaki and Akihiro Ida and Rio Yokota}, title = {Optimization of Hierarchical Matrix Computation on GPU}, booktitle = {}, year = 2018, } @inproceedings{CTT100759343, author = {桑村祐二 and 大沢和樹 and 横田理央}, title = {自然勾配法の近似手法における学習パラメータの調整}, booktitle = {}, year = 2018, } @inproceedings{CTT100759341, author = {Hiroki Naganuma and Rio Yokota}, title = {Accelerating Convolutional 
Neural Networks Using Low Precision Arithmetic}, booktitle = {}, year = 2018, } @inproceedings{CTT100759338, author = {長沼大樹 and 横田理央}, title = {畳み込みニューラル ネットワークにおける低精度演算を用いた高速化の検証}, booktitle = {}, year = 2017, } @inproceedings{CTT100755398, author = {大沢和樹 and 関谷翠 and 長沼大樹 and 横田理央}, title = {低ランクテンソル分解を用いた畳み込みニューラルネットワークの高速化}, booktitle = {}, year = 2017, } @inproceedings{CTT100755397, author = {長沼大樹 and 関谷翠 and 大沢和樹 and 大友広幸 and 桑村裕二 and 横田理央}, title = {深層学習における低精度演算を用いた高速化及びアクセラレーターの性能評価}, booktitle = {}, year = 2017, } @inproceedings{CTT100751154, author = {Kazuki Oosawa and Rio Yokota}, title = {Evaluating the Compression Efficiency of the Filters in Convolutional Neural Networks}, booktitle = {}, year = 2017, } @inproceedings{CTT100755396, author = {長沼大樹 and 大沢和樹 and 関谷翠 and 横田理央}, title = {深層学習における半精度演算を用いた圧縮モデルの高速化}, booktitle = {}, year = 2017, } @inproceedings{CTT100751153, author = {Mustafa AbdulJabbar and Mohammed Al Farhan and Rio Yokota and David Keyes}, title = {Performance Evaluation of Computation and Communication Kernels of the Fast Multipole Method on Intel Manycore Architecture}, booktitle = {}, year = 2017, } @inproceedings{CTT100751142, author = {Kazuki Oosawa and Akira Sekiya and Hiroki Naganuma and Rio Yokota}, title = {Accelerating Matrix Multiplication in Deep Learning by Using Low-Rank Approximation}, booktitle = {}, year = 2017, } @inproceedings{CTT100751150, author = {大島 聡史 and 山崎 市太郎 and 伊田 明弘 and 横田理央}, title = {GPUクラスタ上における階層型行列計算の最適化}, booktitle = {}, year = 2017, } @inproceedings{CTT100751139, author = {Mustafa AbdulJabbar and George Markomanolis and Huda Ibeid and Rio Yokota and David Keyes}, title = {Communication Reducing Algorithms for Distributed Hierarchical N-Body Methods}, booktitle = {Lecture Notes in Computer Science}, year = 2017, } @inproceedings{CTT100751140, author = {Rio Yokota}, title = {Hierarchical Low-Rank Approximations at Extreme Scale}, booktitle = {}, year = 2017, } @inproceedings{CTT100751136, author = 
{大沢和樹 and 関谷翠 and 長沼大樹 and 横田理央}, title = {畳み込みニューラルネットワークの低ランク近似を用いた高速化}, booktitle = {計算工学講演会論文集 Vol.22}, year = 2017, } @inproceedings{CTT100751133, author = {関谷翠 and 大沢和樹 and 長沼大樹 and 横田理央}, title = {低ランク近似を用いた深層学習の行列積の高速化}, booktitle = {}, year = 2017, } @inproceedings{CTT100737180, author = {本山 義史 and 遠藤 敏夫 and 松岡 聡 and 横田 理央 and 福田 圭祐 and 佐藤 育郎}, title = {低ランク近似行列によるCNNにおける畳み込み演算の最適化}, booktitle = {2017-HPC-158 No.25}, year = 2017, } @inproceedings{CTT100751127, author = {Rio Yokota}, title = {Energy Conservation of Fast Multipole Methods in Classical Molecular Dynamics Simulations}, booktitle = {}, year = 2017, } @inproceedings{CTT100751129, author = {Rio Yokota}, title = {Compute-Memory Tradeoff in Hierarchical Low-Rank Approximation Methods}, booktitle = {}, year = 2017, } @inproceedings{CTT100737166, author = {Keisuke Fukuda and Motohiko Matsuda and Naoya Maruyama and Rio Yokota and Kenjiro Taura and Satoshi Matsuoka}, title = {Tapas: An Implicitly Parallel Programming Framework For Hierarchical N-body Algorithms}, booktitle = {The 22nd IEEE International Conference on Parallel And Distributed Systems}, year = 2016, } @inproceedings{CTT100751126, author = {Rio Yokota}, title = {Improving Data Locality of Fast Multipole Methods}, booktitle = {}, year = 2016, } @inproceedings{CTT100718835, author = {Rio Yokota}, title = {Fast Multipole Method as a Matrix-free Hierarchical Low-rank Approximation}, booktitle = {}, year = 2016, } @inproceedings{CTT100718802, author = {横田理央}, title = {Fast Multipole Method を用いた多種アーキテクチャ向け スーパーコンピュータ用ライブラリの開発と 分子・流体シミュレーションでの評価}, booktitle = {}, year = 2016, } @inproceedings{CTT100718803, author = {横田理央}, title = {FMMの性能の可搬性}, booktitle = {}, year = 2016, } @inproceedings{CTT100751123, author = {Huda Ibeid and Rio Yokota and David Keyes}, title = {A Matrix-Free Preconditioner for Elliptic Solvers Based on the Fast Multipole Method}, booktitle = {}, year = 2016, } @inproceedings{CTT100718829, author = {Rio Yokota}, title = {A 
Common API for Fast Multipole Methods}, booktitle = {}, year = 2016, } @inproceedings{CTT100751125, author = {横田理央}, title = {FMMの自動チューニング可能なパラメータについて}, booktitle = {}, year = 2015, } @inproceedings{CTT100718833, author = {Rio Yokota and Francois-Henri Rouet and Xiaoye Sherry Li}, title = {Comparison of FMM and HSS at Large Scale}, booktitle = {}, year = 2015, } @inproceedings{CTT100718834, author = {Rio Yokota and Huda Ibeid and David Keyes}, title = {Preconditioning Sparse Matrices Using a Highly Scalable Fast Multipole Method}, booktitle = {}, year = 2015, } @inproceedings{CTT100751120, author = {Rio Yokota}, title = {Various Implementations of FMM and Their Performance on Future Architectures}, booktitle = {}, year = 2015, } @inproceedings{CTT100751118, author = {Huda Ibeid and Jennifer Pestana and Rio Yokota and David Keyes}, title = {Fast Multipole Method as Preconditioner}, booktitle = {}, year = 2015, } @inproceedings{CTT100718836, author = {Rio Yokota}, title = {ExaFMM -- a Testbed for Comparing Various Implementations of the FMM}, booktitle = {}, year = 2015, } @inproceedings{CTT100718842, author = {Huda Ibeid and Rio Yokota and Jennifer Pestana and David Keyes}, title = {Fast Multipole Preconditioners for Sparse Linear Solvers}, booktitle = {}, year = 2014, } @inproceedings{CTT100718843, author = {Rio Yokota and David Keyes}, title = {Communication Complexity of the Fast Multipole Method and its Algebraic Variants}, booktitle = {}, year = 2014, } @inproceedings{CTT100718845, author = {Hatem Ltaief and Rio Yokota}, title = {High Performance Numerical Algorithms for Seismic and Reservoir Simulations}, booktitle = {}, year = 2014, } @inproceedings{CTT100718846, author = {Rio Yokota}, title = {Fast N-body Methods as a Compute-Bound Preconditioner for Sparse Solvers on GPUs}, booktitle = {}, year = 2014, } @inproceedings{CTT100759347, author = {Abdelhalim Amer and Naoya Maruyama and Miquel Pericas and Kenjiro Taura and Rio Yokota and Satoshi Matsuoka}, title 
= {Fork-Join and Data-Driven Execution Models on Multi-core Architectures: Case Study of the FMM}, booktitle = {Lecture notes in computer science, LNCS}, year = 2013, } @inproceedings{CTT100718848, author = {Jennifer Pestana and Rio Yokota and Huda Ibeid and David Keyes}, title = {Fast Multipole Method Preconditioning}, booktitle = {}, year = 2013, } @inproceedings{CTT100718851, author = {Rio Yokota}, title = {Advances in Fast Multipole Methods for Scalable Electrostatics Calculations}, booktitle = {}, year = 2013, } @inproceedings{CTT100718852, author = {Abdul Abdelfatteh and Hatem Ltaief and Rio Yokota}, title = {Investigating New Numerical Techniques for Reservoir Simulations on GPUs}, booktitle = {}, year = 2013, } @inproceedings{CTT100718855, author = {Huda Ibeid and Rio Yokota and David Keyes}, title = {Fast Multipole Method as a Preconditioner}, booktitle = {}, year = 2013, } @inproceedings{CTT100718860, author = {Kenjiro Taura and Jun Nakashima and Rio Yokota and Naoya Maruyama}, title = {A Task Parallelism Meets Fast Multipole Methods}, booktitle = {}, year = 2012, } @inproceedings{CTT100718863, author = {Rio Yokota}, title = {Petascale Fast Multipole Methods on GPUs}, booktitle = {}, year = 2012, } @inproceedings{CTT100718866, author = {Rio Yokota}, title = {Petascale Fast Multipole Methods on GPUs}, booktitle = {}, year = 2012, } @inproceedings{CTT100718871, author = {Hatem Ltaief and Rio Yokota}, title = {Data-Driven Fast Multipole Method on Distributed Memory Systems with Hardware Accelerators}, booktitle = {}, year = 2012, } @inproceedings{CTT100718868, author = {Enas Yunis and Rio Yokota and Aron Ahmadia}, title = {Scalable Force Directed Graph Layout Algorithms Using Fast Multipole Methods}, booktitle = {}, year = 2012, } @inproceedings{CTT100718874, author = {Rio Yokota and Lorena Barba}, title = {Recent Trends in Hierarchical N-body Methods on GPUs}, booktitle = {}, year = 2012, } @inproceedings{CTT100718876, author = {Rio Yokota and Tetsu Narumi 
and Lorena Barba and Kenji Yasuoka}, title = {Scaling Fast Multipole Methods up to 4000 GPUs}, booktitle = {}, year = 2012, } @inproceedings{CTT100718878, author = {Hoang Vu Nguyen and Rio Yokota and Georgiy Stenchikov}, title = {A Parallel Numerical Simulation of Dust Particles Using Direct Numerical Simulation}, booktitle = {}, year = 2012, } @inproceedings{CTT100718877, author = {Rio Yokota}, title = {Running Fast Multipole Method on the Full Node of TSUBAME and K computer}, booktitle = {}, year = 2012, } @inproceedings{CTT100718882, author = {Rio Yokota}, title = {Fast N-body Methods on Many-core and Heterogeneous Systems}, booktitle = {}, year = 2012, } @inproceedings{CTT100718885, author = {Rio Yokota}, title = {Petaflops Scale Turbulence Simulation on TSUBAME 2.0}, booktitle = {}, year = 2011, } @inproceedings{CTT100718887, author = {Tetsu Narumi and Rio Yokota and Lorena Barba and Kenji Yasuoka}, title = {Petascale Turbulence Simulation Using FMM}, booktitle = {}, year = 2011, } @inproceedings{CTT100718889, author = {Rio Yokota and Lorena Barba}, title = {Parameter Tuning of a Hybrid Treecode-FMM on GPUs}, booktitle = {}, year = 2011, } @inproceedings{CTT100718888, author = {Rio Yokota and Lorena Barba}, title = {Fast Multipole Method vs. 
Spectral Methods for the Simulation of Isotropic Turbulence on GPUs}, booktitle = {}, year = 2011, }

@comment{
  Conference-paper entries for 2005 through 2011, keyed by CTT record ids.
  Acronyms and proper nouns in titles are wrapped in braces so that
  sentence-casing bibliography styles do not lowercase them.
  NOTE(review): every booktitle below is empty. booktitle is a required
  field for inproceedings entries, so each one will raise a missing-field
  warning until the venue is filled in from the publication record.
}

@inproceedings{CTT100718890,
  author    = {Rio Yokota and Lorena Barba},
  title     = {Large Scale {Multi-GPU} {FMM} for Bioelectrostatics},
  booktitle = {},
  year      = 2011,
}

@inproceedings{CTT100718891,
  author    = {Rio Yokota},
  title     = {12 Steps to a Fast Multipole Method on {GPUs}},
  booktitle = {},
  year      = 2011,
}

@inproceedings{CTT100718894,
  author    = {Rio Yokota and Jaydeep Bardhan and Matthew Knepley and Lorena Barba},
  title     = {(Really) Fast Macromolecular Electrostatics -- Fast Algorithms, Open Software and Accelerated Computing},
  booktitle = {},
  year      = 2010,
}

@inproceedings{CTT100718895,
  author    = {Rio Yokota and Lorena Barba},
  title     = {{RBF} Interpolation using {Gaussians} with Domain Decomposition on {GPUs}},
  booktitle = {},
  year      = 2010,
}

@inproceedings{CTT100718896,
  author    = {Rio Yokota and Lorena Barba},
  title     = {Performance of the Fast Multipole Method on {GPUs} Using Various Kernels},
  booktitle = {},
  year      = 2010,
}

@inproceedings{CTT100718897,
  author    = {Rio Yokota and Lorena Barba},
  title     = {Comparing the Treecode with {FMM} on {GPUs} for Vortex Particle Simulations of a Leapfrogging Vortex Ring},
  booktitle = {},
  year      = 2010,
}

@inproceedings{CTT100718898,
  author    = {Rio Yokota and Shinnosuke Obi},
  title     = {{Lagrangian} Simulation of Turbulence Using Vortex Methods},
  booktitle = {},
  year      = 2010,
}

@inproceedings{CTT100718899,
  author    = {Rio Yokota},
  title     = {Range of Applications for the Fast Multipole Method on {GPUs}},
  booktitle = {},
  year      = 2010,
}

@inproceedings{CTT100718900,
  author    = {Tsuyoshi Hamada and Rio Yokota and Keigo Nitadori and Tetsu Narumi and Kenji Yasuoka and Makoto Taiji and Kiyoshi Oguri},
  title     = {42 {TFlops} Hierarchical {N-Body} Simulation on {GPUs} with Applications in Both Astrophysics and Turbulence},
  booktitle = {},
  year      = 2009,
}

@inproceedings{CTT100718905,
  author    = {横田理央 and 小尾晋之介},
  title     = {平行平板間乱流における渦法の検証},
  booktitle = {},
  year      = 2009,
}

@inproceedings{CTT100718904,
  author    = {Rio Yokota and Koji Fukagata and Shinnosuke Obi},
  title     = {{Lagrangian} Vortex Methods in Turbulent Channel Flows},
  booktitle = {},
  year      = 2009,
}

@inproceedings{CTT100718906,
  author    = {Rio Yokota and Tetsu Narumi and Ryuji Sakamaki and Kenji Yasuoka and Shinnosuke Obi},
  title     = {Fast Multipole Methods on {GPUs} for the Meshfree Simulation of Turbulence},
  booktitle = {},
  year      = 2009,
}

@inproceedings{CTT100718907,
  author    = {Rio Yokota and Tetsu Narumi and Ryuji Sakamaki and Shun Kameoka and Kenji Yasuoka and Shinnosuke Obi},
  title     = {{DNS} of Homogeneous Turbulence Using Vortex Methods Accelerated by the {FMM} on a Cluster of {GPUs}},
  booktitle = {},
  year      = 2009,
}

@inproceedings{CTT100718908,
  author    = {Rio Yokota and Tetsu Narumi and Ryuji Sakamaki and Shun Kameoka and Kenji Yasuoka and Shinnosuke Obi},
  title     = {Meshfree Simulation of Turbulence Using the Fast Multipole Methods on {GPUs}},
  booktitle = {},
  year      = 2008,
}

@inproceedings{CTT100718909,
  author    = {横田 理央 and 小尾 晋之介},
  title     = {渦法を用いた平行平板間乱流の解析},
  booktitle = {},
  year      = 2008,
}

@inproceedings{CTT100718910,
  author    = {Rio Yokota and Shinnosuke Obi},
  title     = {Direct Numerical Simulation of Homogeneous Shear Flow Using Vortex Methods},
  booktitle = {},
  year      = 2008,
}

@inproceedings{CTT100718912,
  author    = {Rio Yokota and Shinnosuke Obi},
  title     = {Mesh-Free Simulation of the Homogeneous Shear Flow Using Vortex Methods},
  booktitle = {},
  year      = 2008,
}

@inproceedings{CTT100718913,
  author    = {佐藤 彰 and 横田 理央 and 小尾 晋之介},
  title     = {三次元渦法による翼端渦の数値解析},
  booktitle = {},
  year      = 2007,
}

@inproceedings{CTT100718915,
  author    = {Rio Yokota and Tetsu Narumi and Kenji Yasuoka and Toshikazu Ebisuzaki and Shinnosuke Obi},
  title     = {{MDGRAPE-3} を用いた渦法による乱流の直接数値シミュレーション},
  booktitle = {},
  year      = 2007,
}

@inproceedings{CTT100718916,
  author    = {Rio Yokota and Shinnosuke Obi},
  title     = {Pure {Lagrangian} Vortex Methods for the Simulation of Decaying Isotropic Turbulence},
  booktitle = {},
  year      = 2007,
}

@inproceedings{CTT100718917,
  author    = {横田 理央 and 小尾 晋之介},
  title     = {渦法による一様せん断流の解析},
  booktitle = {},
  year      = 2007,
}

@inproceedings{CTT100718918,
  author    = {横田 理央 and 小尾 晋之介},
  title     = {渦法によるメッシュフリー乱流解析},
  booktitle = {},
  year      = 2007,
}

@inproceedings{CTT100718919,
  author    = {横田 理央 and 小尾 晋之介},
  title     = {渦法による一様等方性乱流の解析},
  booktitle = {},
  year      = 2006,
}

@inproceedings{CTT100718920,
  author    = {横田 理央 and 小尾 晋之介},
  title     = {3次元渦法・境界要素法による流体-固体連成解析},
  booktitle = {},
  year      = 2006,
}

@inproceedings{CTT100718921,
  author    = {横田 理央 and 小尾 晋之介},
  title     = {渦法を用いた物体後流の3次元解析},
  booktitle = {},
  year      = 2006,
}

@inproceedings{CTT100718922,
  author    = {Rio Yokota and Shinnosuke Obi},
  title     = {Vortex Flow Simulation Between Multiple Bridge Decks},
  booktitle = {},
  year      = 2006,
}

@inproceedings{CTT100718924,
  author    = {横田 理央 and 小尾 晋之介},
  title     = {複数の鈍い形状物体周りの渦流れシミュレーション},
  booktitle = {},
  year      = 2005,
}

@inproceedings{CTT100718923,
  author    = {Rio Yokota and Shinnosuke Obi},
  title     = {Vortex Flow Simulation of Multiple Bluff Bodies},
  booktitle = {},
  year      = 2005,
}