@book{CTT100686327,
  author    = {Mustafa AbdulJabbar and Rio Yokota},
  title     = {N-body methods},
  publisher = {Morgan Kaufmann},
  year      = {2014},
}

@book{CTT100686328,
  author    = {Rio Yokota and Lorena Barba},
  title     = {Treecode and fast multipole method for N-body simulation with CUDA},
  publisher = {Morgan Kaufmann},
  year      = {2011},
}

@comment{CTT100905175: the exported record listed four affiliations in place of the first four authors, and the title had lost its spaces and gained a trailing "Abstract". Authors and title are restored from the workshop version of the same paper, CTT100890864. NOTE(review): confirm the author order against the published TMLR paper.}
@article{CTT100905175,
  author  = {Hiroki Naganuma and Kartik Ahuja and Shiro Takagi and Tetsuya Motokawa and Rio Yokota and Kohta Ishikawa and Ikuro Sato and Ioannis Mitliagkas},
  title   = {Empirical Study on Optimizer Selection for Out-of-Distribution Generalization},
  journal = {Transactions on Machine Learning Research},
  year    = {2023},
}

@article{CTT100872027,
  author  = {Muhammad Ridwan Apriansyah and Rio Yokota},
  title   = {Parallel QR Factorization of Block Low-Rank Matrices},
  journal = {ACM Transactions on Mathematical Software},
  year    = {2022},
}

@comment{CTT100867097: journal name corrected from "...Computing Application" to the spelling used by CTT100807737.}
@article{CTT100867097,
  author  = {Hiroyuki Ootomo and Rio Yokota},
  title   = {Recovering single precision accuracy from Tensor Cores while surpassing the FP32 theoretical peak performance},
  journal = {The International Journal of High Performance Computing Applications},
  year    = {2022},
}

@article{CTT100862742,
  author  = {Tingyu Wang and Rio Yokota and Lorena A. Barba},
  title   = {ExaFMM: a high-performance fast multipole method library with C++ and Python interfaces},
  journal = {The Journal of Open Source Software},
  year    = {2021},
}

@article{CTT100832475, author = {Davoud S.
Shamshirgar and Rio Yokota and Anna-Karin Tornberg and Berk Hess}, title = {Regularizing the Fast Multipole Method for use in Molecular Simulation}, journal = {Journal of Chemical Physics}, year = 2020, }

@article{CTT100832594,
  author  = {Kazuki Osawa and Yohei Tsuji and Yuichiro Ueno and Akira Naruse and Chuan-Sheng Foo and Rio Yokota},
  title   = {Scalable and Practical Natural Gradient for Large-Scale Deep Learning},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2020},
}

@article{CTT100815367,
  author  = {Rio Yokota},
  title   = {巨大行列とAI},
  journal = {数学セミナー},
  year    = {2020},
}

@article{CTT100815366,
  author  = {Rio Yokota},
  title   = {スーパーコンピューティングコンテスト2019},
  journal = {数学セミナー},
  year    = {2020},
}

@article{CTT100811319,
  author  = {Akihiro Ida and Hiroshi Nakashima and Tasuku Hiraishi and Ichitaro Yamazaki and Rio Yokota and Takeshi Iwashita},
  title   = {QR Factorization of Block Low-rank Matrices with Weak Admissibility Condition},
  journal = {Journal of Information Processing},
  year    = {2019},
}

@article{CTT100807737,
  author  = {Ichitaro Yamazaki and Akihiro Ida and Rio Yokota and Jack Dongarra},
  title   = {Distributed Memory Lattice H-matrix Factorization},
  journal = {The International Journal of High Performance Computing Applications},
  year    = {2019},
}

@article{CTT100815304,
  author  = {Mustafa AbdulJabbar and Mohammed Al Farhan and Noha Al-Harthi and Rui Chen and Rio Yokota and Hakan Bagci and David Keyes},
  title   = {Extreme Scale FMM-Accelerated Boundary Integral Equation Solver for Wave Scattering},
  journal = {SIAM Journal on Scientific Computing},
  year    = {2019},
}

@article{CTT100781338, author = {Naoya Maruyama and Takayuki Aoki and Kenjiro Taura and Rio Yokota and Mohamed Wahib and Motohiko Matsuda and Keisuke Fukuda and Takashi Shimokawabe and Naoyuki Onodera and Michel Müller and Shintaro Iwasaki}, title = {Highly Productive, High-Performance Application Frameworks for Post-Petascale Computing}, journal = {Advanced Software Technologies for Post-Peta
Scale Computing}, year = 2018, }

@article{CTT100760854,
  author  = {Huda Ibeid and Rio Yokota and Jennifer Pestana and David Keyes},
  title   = {Fast Multipole Preconditioners for Sparse Matrices Arising from Elliptic Equations},
  journal = {Computing and Visualization in Science},
  year    = {2017},
}

@comment{CTT100734509: the superscript in the title is now set in math mode and braced, because a bare caret in text mode is a LaTeX error when the title is typeset.}
@article{CTT100734509,
  author  = {Rio Yokota},
  title   = {Tradeoff Between FMM and {$H^2$}(HSS) matrices},
  journal = {Journal of the Japan Society for Computational Engineering and Science},
  year    = {2016},
}

@article{CTT100734510,
  author  = {Rio Yokota},
  title   = {Communication Optimization of Distributed Memory FMM for Large Scale Boundary Element Methods},
  journal = {Simulation},
  year    = {2016},
}

@article{CTT100718789,
  author  = {Huda Ibeid and Rio Yokota and David Keyes},
  title   = {A performance model for the communication in fast multipole methods on high-performance computing platforms},
  journal = {International Journal of High Performance Computing Applications},
  year    = {2016},
}

@article{CTT100791168,
  author  = {Abdelhalim Amer and Satoshi Matsuoka and Miquel Pericàs and Naoya Maruyama and Kenjiro Taura and Rio Yokota and Pavan Balaji},
  title   = {Scaling FMM with data-driven OpenMP tasks on multicore architectures},
  journal = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  year    = {2016},
}

@article{CTT100718790,
  author  = {Julio Castrillon-Candas and Marc Genton and Rio Yokota},
  title   = {Multi-level restricted maximum likelihood covariance estimation and kriging for large non-gridded spatial datasets},
  journal = {Spatial Statistics},
  year    = {2015},
}

@article{CTT100686123, author = {Yousuke Ohno and Rio Yokota and Hiroshi Koyama and Gentaro Morimoto and Aki Hasegawa and Gen Masumoto and Noriaki Okimoto and Yoshinori Hirano and Huda Ibeid and Tetsu Narumi and Makoto Taiji}, title = {Petascale molecular dynamics simulation using the fast multipole method on K computer}, journal = {Computer Physics
Communications}, year = 2014, }

@article{CTT100686122,
  author  = {Rio Yokota and George Turkiyyah and David E. Keyes},
  title   = {Communication complexity of the fast multipole method and its algebraic variants},
  journal = {Supercomputing Frontiers and Innovations},
  year    = {2014},
}

@article{CTT100686125,
  author  = {Rio Yokota},
  title   = {An FMM based on dual tree traversal for many-core architectures},
  journal = {Journal of Algorithms and Computational Technology},
  year    = {2013},
}

@article{CTT100686124,
  author  = {Hatem Ltaief and Rio Yokota},
  title   = {Data-driven execution of fast multipole methods},
  journal = {Concurrency and Computation: Practice and Experience},
  year    = {2013},
}

@article{CTT100686126,
  author  = {Rio Yokota and Lorena Barba and Tetsu Narumi and Kenji Yasuoka},
  title   = {Petascale turbulence simulation using a highly parallel fast multipole method},
  journal = {Computer Physics Communications},
  year    = {2012},
}

@article{CTT100686127,
  author  = {Rio Yokota and Lorena Barba},
  title   = {FMM-based vortex method for simulation of isotropic turbulence on GPUs, compared with a spectral method},
  journal = {Computers and Fluids},
  year    = {2012},
}

@article{CTT100686128,
  author  = {Rio Yokota and Lorena Barba},
  title   = {A Tuned and scalable fast multipole method as a preeminent algorithm for exascale systems},
  journal = {International Journal of High Performance Computing Applications},
  year    = {2012},
}

@article{CTT100686129,
  author  = {Rio Yokota and Lorena Barba},
  title   = {Hierarchical N-body simulations with auto-tuning for heterogeneous systems},
  journal = {Computing in Science and Engineering},
  year    = {2012},
}

@article{CTT100686130, author = {Jaydeep Bardhan and R.
Yokota and Matthew Knepley and Lorena Barba and Tsuyoshi Hamada}, title = {Biomolecular electrostatics using a fast multipole BEM on up to 512 GPUs and a billion unknowns}, journal = {Computer Physics Communications}, year = 2011, }

@article{CTT100686325,
  author  = {Rio Yokota and Shinnosuke Obi},
  title   = {Vortex methods for the simulation of turbulent flows},
  journal = {Journal of Fluid Science and Technology},
  year    = {2011},
}

@article{CTT100686131,
  author  = {Rio Yokota and Lorena Barba},
  title   = {Comparing the treecode with FMM on GPUs for vortex particle simulations of a leapfrogging vortex ring},
  journal = {Computers and Fluids},
  year    = {2010},
}

@article{CTT100686135,
  author  = {Rio Yokota and Lorena Barba and Matthew Knepley},
  title   = {PetRBF–A parallel O(N) algorithm for radial basis function interpolation with Gaussians},
  journal = {Computer Methods in Applied Mechanics and Engineering},
  year    = {2010},
}

@article{CTT100686134,
  author  = {Rio Yokota and Shinnosuke Obi},
  title   = {Comparing vortex methods and finite difference methods in a homogeneous turbulent shear flow},
  journal = {International Journal for Numerical Methods in Fluids},
  year    = {2009},
}

@article{CTT100686136,
  author  = {Rio Yokota and Tetsu Narumi and Ryuji Sakamaki and Shun Kameoka and Shinnosuke Obi and Kenji Yasuoka},
  title   = {Fast multipole methods on a cluster of GPUs for the meshless simulation of turbulence},
  journal = {Computer Physics Communications},
  year    = {2009},
}

@article{CTT100686137,
  author  = {Rio Yokota and Tarun Kumar Sheel and Shinnosuke Obi},
  title   = {Calculation of isotropic turbulence using a pure Lagrangian vortex method},
  journal = {Journal of Computational Physics},
  year    = {2007},
}

@inproceedings{CTT100906352, author = {Tomoya Takahashi and Shingo Yashima and Kohta Ishikawa and Ikuro Sato and Rio Yokota}, title = {Pixel-level Contrastive Learning of Driving Videos with Optical Flow}, booktitle = {Proc.
CVPR workshop 2023}, year = 2023, }

@inproceedings{CTT100890866,
  author    = {Aoyu Li and Ikuro Sato and Kohta Ishikawa and Rei Kawakami and Rio Yokota},
  title     = {Informative Sample-Aware Proxy for Deep Metric Learning},
  booktitle = {},
  year      = {2022},
}

@comment{CTT100895747: author names were exported in all capitals; they now use the same capitalisation as the other entries in this file.}
@inproceedings{CTT100895747,
  author    = {Ryu Tadokoro and Hirokatsu Kataoka and Rei Kawakami and Rio Yokota and Nakamasa Inoue},
  title     = {蒸留画像による事前学習効果についての検討},
  booktitle = {講演論文集},
  year      = {2022},
}

@inproceedings{CTT100874414,
  author    = {Qianxiang Ma and Sameer Deshmukh and Rio Yokota},
  title     = {Scalable Linear Time Dense Direct Solver for 3-D Problems Without Trailing Sub-Matrix Dependencies},
  booktitle = {},
  year      = {2022},
}

@inproceedings{CTT100890864,
  author    = {Hiroki Naganuma and Kartik Ahuja and Ioannis Mitliagkas and Shiro Takagi and Tetsuya Motokawa and Rio Yokota and Kohta Ishikawa and Ikuro Sato},
  title     = {Empirical Study on Optimizer Selection for Out-of-Distribution Generalization},
  booktitle = {Proc. NeurIPS 2022},
  year      = {2022},
}

@comment{CTT100882020: the exported author list repeated the same two people (Akihiro Ida was also given in kanji, and the second author appeared twice); the duplicates are removed. NOTE(review): confirm the author list against the original record.}
@inproceedings{CTT100882020,
  author    = {Akihiro Ida and 荻田 武史 and Rio Yokota},
  title     = {対称ブロック低ランク行列の精度保証付き固有値問題解法},
  booktitle = {},
  year      = {2022},
}

@inproceedings{CTT100881749,
  author    = {Rio Yokota},
  title     = {Matrices in Deep Neural Networks and How to Compute Them in Parallel},
  booktitle = {},
  year      = {2022},
}

@inproceedings{CTT100890860,
  author    = {Tomoya Takahashi and 八嶋晋吾 and 石川康太 and Ikuro Sato and Rio Yokota},
  title     = {走行動画の大規模自己教師あり学習の検討と計画},
  booktitle = {MIRUブックレット},
  year      = {2022},
}

@inproceedings{CTT100890854,
  author    = {Aoyu Li and Ikuro Sato and 石川康太 and Rei Kawakami and Rio Yokota},
  title     = {Informative Sample-Aware Proxy for Deep Metric Learning},
  booktitle = {MIRUブックレット},
  year      = {2022},
}

@inproceedings{CTT100866763, author = {Hirokatsu Kataoka and Ryo Hayamizu and Ryosuke Yamada and Kodai Nakashima and Sora Takashima and Xinyu Zhang and Edgar Josafat Martinez-Noriega and Nakamasa Inoue and Rio Yokota}, title = {Replacing Labeled Real-image Datasets with
Auto-generated Contours}, booktitle = {}, year = 2022, }

@inproceedings{CTT100865536,
  author    = {Hana Hoshino and Kei Ota and Asako Kanezaki and Rio Yokota},
  title     = {OPIRL: Sample Efficient Off-Policy Inverse Reinforcement Learning via Distribution Matching},
  booktitle = {},
  year      = {2022},
}

@inproceedings{CTT100869126,
  author    = {Muhammad Ridwan Apriansyah and Rio Yokota},
  title     = {Parallel QR Factorization of Block Low-rank Matrices},
  booktitle = {},
  year      = {2022},
}

@inproceedings{CTT100869125,
  author    = {Sameer Satish Deshmukh and Rio Yokota},
  title     = {Acceleration of O(N) Solvers for Large Dense Matrices},
  booktitle = {},
  year      = {2022},
}

@inproceedings{CTT100866867,
  author    = {Shiyukai Nakamura and Rio Yokota},
  title     = {Vision Transformerにおけるバッチサイズの汎化性能への影響},
  booktitle = {},
  year      = {2022},
}

@inproceedings{CTT100866866,
  author    = {Hiro Ishii and Rio Yokota},
  title     = {深層学習における2次最適化の汎化性能の検証},
  booktitle = {},
  year      = {2022},
}

@inproceedings{CTT100869127,
  author    = {Thomas Spendlhofer and Rio Yokota},
  title     = {Iterative Refinement with Hierarchical Low-rank Preconditioners Using Mixed Precision},
  booktitle = {},
  year      = {2022},
}

@inproceedings{CTT100862738,
  author    = {Rio Yokota},
  title     = {二次最適化を用いた分散並列深層学習},
  booktitle = {},
  year      = {2021},
}

@inproceedings{CTT100862737,
  author    = {Rio Yokota},
  title     = {Approximations of Natural Gradient Descent in Distributed Training},
  booktitle = {},
  year      = {2021},
}

@inproceedings{CTT100860388, author = {Shun Iwase and Xingyu Liu and Rawal Khirodkar and Rio Yokota and Kris M.
Kitani}, title = {RePOSE: Real-Time Iterative Rendering and Refinement for 6D Object Pose Estimation}, booktitle = {}, year = 2021, }

@inproceedings{CTT100862739,
  author    = {Rio Yokota},
  title     = {階層的低ランク近似法に関するレビュー},
  booktitle = {},
  year      = {2021},
}

@inproceedings{CTT100854272,
  author    = {Yuichiro Ueno and Kazuki Osawa and Yohei Tsuji and Akira Naruse and Rio Yokota},
  title     = {Rich Information is Affordable: A Systematic Performance Analysis of Second-order Optimization Using K-FAC},
  booktitle = {},
  year      = {2021},
}

@inproceedings{CTT100862736,
  author    = {Hikaru Nakata and Nakamasa Inoue and Rio Yokota},
  title     = {Self-supervised Continual Pretraining for Class Incremental Image Classification},
  booktitle = {Proc. CVPR CLVISION Workshop (Findings)},
  year      = {2021},
}

@inproceedings{CTT100862740,
  author    = {Rio Yokota},
  title     = {スパコンを用いた大規模並列分散深層学習},
  booktitle = {},
  year      = {2021},
}

@inproceedings{CTT100862741,
  author    = {Rio Yokota},
  title     = {深層学習におけるヘッセ行列,フィッシャー行列,共分散行列の高速近似解法},
  booktitle = {},
  year      = {2020},
}

@inproceedings{CTT100835680,
  author    = {Rio Yokota},
  title     = {Degree of Approximation and Overhead of Computing Curvature},
  booktitle = {},
  year      = {2020},
}

@inproceedings{CTT100832592,
  author    = {Sameer Deshmukh and Rio Yokota},
  title     = {Distributed Memory Task-Based Block Low Rank Direct Solver},
  booktitle = {},
  year      = {2020},
}

@inproceedings{CTT100835684,
  author    = {Hikaru Nakata and Rio Yokota},
  title     = {画像分類のための継続的な事前学習における教師なし表現学習の堅牢性に関する検証},
  booktitle = {},
  year      = {2020},
}

@inproceedings{CTT100832593,
  author    = {Hiroyuki Ootomo and Rio Yokota},
  title     = {Randomized SVD on TensorCores},
  booktitle = {},
  year      = {2020},
}

@inproceedings{CTT100835685,
  author    = {Hiroyuki Ootomo and Rio Yokota},
  title     = {TensorコアのAPIの構造解析を用いた拡張ライブラリの開発},
  booktitle = {},
  year      = {2020},
}

@inproceedings{CTT100835682,
  author    = {Rio Yokota and Yohei Tsuji and Kazuki Osawa},
  title     = {Second Order Optimization for Distributed Data-parallel Deep Learning on 4000 GPUs},
  booktitle = {},
  year      = {2020},
}
@inproceedings{CTT100835686,
  author    = {Takahiro Shohata and Hiroki Naganuma and Rio Yokota},
  title     = {確率的重み付け平均法のラージバッチ学習における有用性の検証},
  booktitle = {},
  year      = {2020},
}

@inproceedings{CTT100835687,
  author    = {Rio Yokota},
  title     = {二次最適化を用いた巨大な言語モデルの学習およびFRNNを用いたプラズマ挙動予測},
  booktitle = {},
  year      = {2020},
}

@inproceedings{CTT100832477,
  author    = {Rise Ooi and Takeshi Iwashita and Takeshi Fukaya and Akihiro Ida and Rio Yokota},
  title     = {Effect of Mixed Precision Computing on H-Matrix Vector Multiplication in BEM Analysis},
  booktitle = {Proceedings of HPC Asia 2020},
  year      = {2020},
}

@inproceedings{CTT100821422,
  author    = {Muhammad Ridwan Apriansyah and Rio Yokota},
  title     = {QR Decomposition of Block Low-Rank Matrices},
  booktitle = {},
  year      = {2020},
}

@inproceedings{CTT100821421,
  author    = {Sameer Deshmukh and Rio Yokota},
  title     = {Distributed Memory Task-Based Block Low Rank Direct Solver},
  booktitle = {},
  year      = {2020},
}

@inproceedings{CTT100803976, author = {Kazuki Osawa and Siddarth Swaroop and Anirudh Jain and Runa Eschenhagen and Richard E.
Turner and Rio Yokota and Mohammad Emtiyaz Khan}, title = {Practical Deep Learning with Bayesian Principles}, booktitle = {}, year = 2019, }

@comment{CTT100819712: the last author was exported in all capitals; it now uses the same capitalisation as CTT100815305.}
@inproceedings{CTT100819712,
  author    = {Keita Yashima and 石川康太 and 佐藤育郎 and Akihiro Nomura and Rio Yokota and Satoshi Matsuoka},
  title     = {早期終了タイミングを予測する:深層学習における確率勾配の分布の変化点検出},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100821426,
  author    = {Hiroki Naganuma and Rio Yokota},
  title     = {On Empirical Analysis of Layer-wised Learning Rate Schedule},
  booktitle = {},
  year      = {2019},
}

@comment{CTT100821424: first author changed from "Qianxing Ma" to the spelling used in CTT100874414. NOTE(review): presumably the same person; confirm.}
@inproceedings{CTT100821424,
  author    = {Qianxiang Ma and Rio Yokota},
  title     = {Runtime System for GPU-based Hierarchical LU factorization},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100821423,
  author    = {Hiroyuki Ootomo and Rio Yokota},
  title     = {TSQR on TensorCores},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100807736,
  author    = {Satoshi Ohshima and Ichitaro Yamazaki and Akihiro Ida and Rio Yokota},
  title     = {Optimization of Numerous Small Dense-Matrix–Vector Multiplications in H-matrix Arithmetic on GPU},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100821425,
  author    = {Hiroyuki Ootomo and Rio Yokota},
  title     = {Tensorコアを用いたTSQR},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100815305,
  author    = {Yohei Tsuji and Kazuki Osawa and Yuichiro Ueno and Akira Naruse and Rio Yokota and Satoshi Matsuoka},
  title     = {Performance Optimizations and Analysis of Distributed Deep Learning with Approximated Second-Order Optimization Method},
  booktitle = {Proceedings of the 48th International Conference on Parallel Processing: Workshops},
  year      = {2019},
}

@inproceedings{CTT100802444, author = {H. Ootomo and R.
Yokota}, title = {GPU Implementation of TSQR Using Tensor Cores}, booktitle = {}, year = 2019, }

@inproceedings{CTT100802443,
  author    = {Peter Spalthoff and Rio Yokota},
  title     = {Flexible and Simplistic Hierarchical Matrix-Based Fast Direct Solver},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100793663,
  author    = {Kazuki Osawa and Yohei Tsuji and Yuichiro Ueno and Akira Naruse and Rio Yokota and Satoshi Matsuoka},
  title     = {Second-order Optimization Method for Large Mini-batch: Training ResNet-50 on ImageNet in 35 Epochs},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100793662,
  author    = {Hiroki Naganuma and Rio Yokota},
  title     = {Effectiveness of Smoothing for Large-batch Training Using Natural Gradient Descent},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100835681,
  author    = {Rio Yokota},
  title     = {Recent Trends in Hierarchical Low-Rank Approximation Methods},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100793660,
  author    = {Yuichiro Ueno and Rio Yokota},
  title     = {Exhaustive Study of Hierarchical AllReduce Patterns for Large Messages Between GPUs},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100793661,
  author    = {Hiroki Naganuma and Rio Yokota},
  title     = {A Performance Improvement Approach for Second-Order Optimization in Large Mini-batch Training},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100793654,
  author    = {Hiroyuki Ootomo and Rio Yokota},
  title     = {Batched QR Decomposition Using TensorCores},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100793653,
  author    = {Hiroki Naganuma and Rio Yokota},
  title     = {Smoothing of the Objective Function for Large Scale Parallel Deep Learning},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100793659,
  author    = {Hiroki Naganuma and Rio Yokota},
  title     = {Improving the Generalization Gap in Large-batch Training Using Noise Injection},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100793658, author = {Rio Yokota and Kazuki Osawa and Yohei Tsuji and Yuichiro Ueno and Akira Naruse}, title = {Second Order
Optimization for Large Scale Parallel Deep Learning}, booktitle = {}, year = 2019, }

@inproceedings{CTT100793657,
  author    = {Kazuki Osawa and Rio Yokota and Chuan-Sheng Foo and Vijay Chandrasekhar},
  title     = {Second Order Optimization for Large Scale Parallel Deep Learning Through Analysis of the Fisher Information Matrix},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100793655,
  author    = {Hikaru Nakata and Kazuki Osawa and Rio Yokota},
  title     = {Variational Inference in Deep Learning Using Natural Gradient Descent},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100835683,
  author    = {Rio Yokota},
  title     = {Kronecker Factorization for Second Order Optimization in Deep Learning},
  booktitle = {},
  year      = {2019},
}

@inproceedings{CTT100771718,
  author    = {Hiroki Naganuma and Shun Iwase and Linsho Kaku and Hikaru Nakata and Rio Yokota},
  title     = {Hyper-parameter Tuning of Approximate Natural Gradient Methods for Highly Parallel Distributed Deep Learning},
  booktitle = {},
  year      = {2018},
}

@inproceedings{CTT100773722,
  author    = {Rio Yokota},
  title     = {Optimization Methods for Large Scale Distributed Deep Learning},
  booktitle = {},
  year      = {2018},
}

@inproceedings{CTT100773723,
  author    = {Rio Yokota},
  title     = {Early Application Results on TSUBAME 3},
  booktitle = {},
  year      = {2018},
}

@inproceedings{CTT100773724,
  author    = {Rio Yokota},
  title     = {Scaling Deep Learning to Thousands of GPUs},
  booktitle = {},
  year      = {2018},
}

@inproceedings{CTT100773725,
  author    = {Rio Yokota},
  title     = {Energy Conserving Fast Multipole Methods for the Calculation of Long-range Interactions},
  booktitle = {},
  year      = {2018},
}

@inproceedings{CTT100759345,
  author    = {Ichitaro Yamazaki and Ahmad Abdelfattah and Akihiro Ida and Satoshi Ohshima and Stanimire Tomov and Rio Yokota and Jack Dongarra},
  title     = {Analyzing Performance of BiCGStab with Hierarchical Matrix on GPU clusters},
  booktitle = {},
  year      = {2018},
}

@comment{CTT100759344: the surname of the last author was lowercase ("Rio yokota"); it is capitalised to match every other entry.}
@inproceedings{CTT100759344, author = {Hiroyuki Ohtomo and Kazuki Osawa and Rio Yokota}, title = {Deep Learning
Using Kronecker-factored Approximation of Fisher Matrix}, booktitle = {}, year = 2018, }

@inproceedings{CTT100773726,
  author    = {Rio Yokota},
  title     = {Can we use Hierarchical Low-Rank Approximation for Deep Learning?},
  booktitle = {},
  year      = {2018},
}

@inproceedings{CTT100760853,
  author    = {Hiroyuki Otomo and Kazuki Osawa and Rio Yokota},
  title     = {Distributed Learning of Deep Neural Networks Using the Kronecker Factorization of the Fisher Information Matrix},
  booktitle = {},
  year      = {2018},
}

@inproceedings{CTT100759346,
  author    = {Satoshi Ohshima and Ichitaro Yamazaki and Akihiro Ida and Rio Yokota},
  title     = {Optimization of Hierarchical Matrix Computation on GPU},
  booktitle = {},
  year      = {2018},
}

@inproceedings{CTT100759343,
  author    = {Yuji Kuwamura and Kazuki Osawa and Rio Yokota},
  title     = {Hyper-parameter Tuning for Approximate Natural Gradient Methods},
  booktitle = {},
  year      = {2018},
}

@inproceedings{CTT100759341,
  author    = {Hiroki Naganuma and Rio Yokota},
  title     = {Accelerating Convolutional Neural Networks Using Low Precision Arithmetic},
  booktitle = {},
  year      = {2018},
}

@inproceedings{CTT100759338,
  author    = {Hiroki Naganuma and Rio Yokota},
  title     = {Verification of Low-precision Arithmetic for the Acceleration of Convolutional Neural Networks},
  booktitle = {},
  year      = {2017},
}

@inproceedings{CTT100755398,
  author    = {K. Osawa and A. Sekiya and H. Naganuma and R. Yokota},
  title     = {Acceleration of Convolutional Neural Networks Using Low-Rank Tensor Decomposition},
  booktitle = {},
  year      = {2017},
}

@inproceedings{CTT100755397,
  author    = {H. Naganuma and A. Sekiya and K. Osawa and H. Otomo and Y. Kuwamura and R. Yokota},
  title     = {Evaluating the Performance of Deep Learning with Low Precision Arithmetic},
  booktitle = {},
  year      = {2017},
}

@inproceedings{CTT100751154,
  author    = {Kazuki Oosawa and Rio Yokota},
  title     = {Evaluating the Compression Efficiency of the Filters in Convolutional Neural Networks},
  booktitle = {},
  year      = {2017},
}

@inproceedings{CTT100755396, author = {H.
Naganuma and K. Osawa and A. Sekiya and R. Yokota}, title = {Acceleration of Compressed Models in Deep Learning Using Half Precision Arithmetic}, booktitle = {}, year = 2017, }

@inproceedings{CTT100751153,
  author    = {Mustafa AbdulJabbar and Mohammed Al Farhan and Rio Yokota and David Keyes},
  title     = {Performance Evaluation of Computation and Communication Kernels of the Fast Multipole Method on Intel Manycore Architecture},
  booktitle = {},
  year      = {2017},
}

@inproceedings{CTT100751142,
  author    = {Kazuki Oosawa and Akira Sekiya and Hiroki Naganuma and Rio Yokota},
  title     = {Accelerating Matrix Multiplication in Deep Learning by Using Low-Rank Approximation},
  booktitle = {},
  year      = {2017},
}

@inproceedings{CTT100751150,
  author    = {Satoshi Ohshima and Ichitaro Yamazaki and Akihiro Ida and Rio Yokota},
  title     = {Optimization of Hierarchical Matrix Computations on a Cluster of GPUs},
  booktitle = {},
  year      = {2017},
}

@comment{CTT100751139: spelling of "Hierarchical" corrected in the title (was "Heirarchical").}
@inproceedings{CTT100751139,
  author    = {Mustafa AbdulJabbar and George Markomanolis and Huda Ibeid and Rio Yokota and David Keyes},
  title     = {Communication Reducing Algorithms for Distributed Hierarchical N-Body Methods},
  booktitle = {Lecture Notes in Computer Science},
  year      = {2017},
}

@inproceedings{CTT100751140,
  author    = {Rio Yokota},
  title     = {Hierarchical Low-Rank Approximations at Extreme Scale},
  booktitle = {},
  year      = {2017},
}

@inproceedings{CTT100751136,
  author    = {Kazuki Oosawa and Akira Sekiya and Hiroki Naganuma and Rio Yokota},
  title     = {Accelerating Convolutional Neural Networks Using Low-Rank Approximation},
  booktitle = {Proceedings of the 22nd Conference of Japan Computational Engineering Society},
  year      = {2017},
}

@comment{CTT100737180: the third author was exported in all capitals; it now uses the capitalisation found in the other entries.}
@inproceedings{CTT100737180,
  author    = {Yoshifumi Motoyama and Toshio Endo and Satoshi Matsuoka and Rio Yokota and Keisuke Fukuda and 佐藤 育郎},
  title     = {Using Low-Rank Approximation in Convolutional Neural Networks},
  booktitle = {2017-HPC-158 No.25},
  year      = {2017},
}

@inproceedings{CTT100751133, author = {Akira Sekiya and Kazuki Oosawa and Hiroki Naganuma and
Rio Yokota}, title = {Acceleration of Matrix Multiplication in Deep Learning Using Low-Rank Approximation}, booktitle = {}, year = 2017, }

@inproceedings{CTT100751129,
  author    = {Rio Yokota},
  title     = {Compute-Memory Tradeoff in Hierarchical Low-Rank Approximation Methods},
  booktitle = {},
  year      = {2017},
}

@inproceedings{CTT100751127,
  author    = {Rio Yokota},
  title     = {Energy Conservation of Fast Multipole Methods in Classical Molecular Dynamics Simulations},
  booktitle = {},
  year      = {2017},
}

@comment{CTT100737166: restored the missing space in "Programming Framework".}
@inproceedings{CTT100737166,
  author    = {Keisuke Fukuda and Motohiko Matsuda and Naoya Maruyama and Rio Yokota and Kenjiro Taura and Satoshi Matsuoka},
  title     = {Tapas: An Implicitly Parallel Programming Framework For Hierarchical N-body Algorithms},
  booktitle = {The 22nd IEEE International Conference on Parallel And Distributed Systems},
  year      = {2016},
}

@inproceedings{CTT100751126,
  author    = {Rio Yokota},
  title     = {Improving Data Locality of Fast Multipole Methods},
  booktitle = {},
  year      = {2016},
}

@inproceedings{CTT100718835,
  author    = {Rio Yokota},
  title     = {Fast Multipole Method as a Matrix-free Hierarchical Low-rank Approximation},
  booktitle = {},
  year      = {2016},
}

@inproceedings{CTT100718802,
  author    = {Rio Yokota},
  title     = {Fast Multipole Method Library for Multiple Architectures and its Application to Molecular and Fluid Simulations},
  booktitle = {},
  year      = {2016},
}

@comment{CTT100718803: spelling of "Performance" corrected in the title (was "Perforamance").}
@inproceedings{CTT100718803,
  author    = {Rio Yokota},
  title     = {Performance Portability of FMM},
  booktitle = {},
  year      = {2016},
}

@inproceedings{CTT100751123,
  author    = {Huda Ibeid and Rio Yokota and David Keyes},
  title     = {A Matrix-Free Preconditioner for Elliptic Solvers Based on the Fast Multipole Method},
  booktitle = {},
  year      = {2016},
}

@inproceedings{CTT100718829,
  author    = {Rio Yokota},
  title     = {A Common API for Fast Multipole Methods},
  booktitle = {},
  year      = {2016},
}

@inproceedings{CTT100751125,
  author    = {Rio Yokota},
  title     = {Auto-tunable Parameters in FMM},
  booktitle = {},
  year      = {2015},
}

@inproceedings{CTT100718833, author = {Rio
Yokota and Francois-Henri Rouet and Xiaoye Sherry Li}, title = {Comparison of FMM and HSS at Large Scale}, booktitle = {}, year = 2015, }

@inproceedings{CTT100718834,
  author    = {Rio Yokota and Huda Ibeid and David Keyes},
  title     = {Preconditioning Sparse Matrices Using a Highly Scalable Fast Multipole Method},
  booktitle = {},
  year      = {2015},
}

@inproceedings{CTT100751120,
  author    = {Rio Yokota},
  title     = {Various Implementations of FMM and Their Performance on Future Architectures},
  booktitle = {},
  year      = {2015},
}

@inproceedings{CTT100751118,
  author    = {Huda Ibeid and Jennifer Pestana and Rio Yokota and David Keyes},
  title     = {Fast Multipole Method as Preconditioner},
  booktitle = {},
  year      = {2015},
}

@inproceedings{CTT100718836,
  author    = {Rio Yokota},
  title     = {ExaFMM -- a Testbed for Comparing Various Implementations of the FMM},
  booktitle = {},
  year      = {2015},
}

@inproceedings{CTT100718842,
  author    = {Huda Ibeid and Rio Yokota and Jennifer Pestana and David Keyes},
  title     = {Fast Multipole Preconditioners for Sparse Linear Solvers},
  booktitle = {},
  year      = {2014},
}

@inproceedings{CTT100718843,
  author    = {Rio Yokota and David Keyes},
  title     = {Communication Complexity of the Fast Multipole Method and its Algebraic Variants},
  booktitle = {},
  year      = {2014},
}

@inproceedings{CTT100718845,
  author    = {Hatem Ltaief and Rio Yokota},
  title     = {High Performance Numerical Algorithms for Seismic and Reservoir Simulations},
  booktitle = {},
  year      = {2014},
}

@inproceedings{CTT100718846,
  author    = {Rio Yokota},
  title     = {Fast N-body Methods as a Compute-Bound Preconditioner for Sparse Solvers on GPUs},
  booktitle = {},
  year      = {2014},
}

@inproceedings{CTT100718848,
  author    = {Jennifer Pestana and Rio Yokota and Huda Ibeid and David Keyes},
  title     = {Fast Multipole Method Preconditioning},
  booktitle = {},
  year      = {2013},
}

@inproceedings{CTT100759347, author = {Abdelhalim Amer and Naoya Maruyama and Miquel Pericas and Kenjiro Taura and Rio Yokota and Satoshi Matsuoka}, title = {Fork-Join and Data-Driven Execution
Models on Multi-core Architectures: Case Study of the FMM}, booktitle = {Lecture notes in computer science, LNCS}, year = 2013, }

@inproceedings{CTT100718851,
  author    = {Rio Yokota},
  title     = {Advances in Fast Multipole Methods for Scalable Electrostatics Calculations},
  booktitle = {},
  year      = {2013},
}

@inproceedings{CTT100718852,
  author    = {Abdul Abdelfatteh and Hatem Ltaief and Rio Yokota},
  title     = {Investigating New Numerical Techniques for Reservoir Simulations on GPUs},
  booktitle = {},
  year      = {2013},
}

@inproceedings{CTT100718855,
  author    = {Huda Ibeid and Rio Yokota and David Keyes},
  title     = {Fast Multipole Method as a Preconditioner},
  booktitle = {},
  year      = {2013},
}

@inproceedings{CTT100718860,
  author    = {Kenjiro Taura and Jun Nakashima and Rio Yokota and Naoya Maruyama},
  title     = {A Task Parallelism Meets Fast Multipole Methods},
  booktitle = {},
  year      = {2012},
}

@inproceedings{CTT100718863,
  author    = {Rio Yokota},
  title     = {Petascale Fast Multipole Methods on GPUs},
  booktitle = {},
  year      = {2012},
}

@inproceedings{CTT100718871,
  author    = {Hatem Ltaief and Rio Yokota},
  title     = {Data-Driven Fast Multipole Method on Distributed Memory Systems with Hardware Accelerators},
  booktitle = {},
  year      = {2012},
}

@inproceedings{CTT100718868,
  author    = {Enas Yunis and Rio Yokota and Aron Ahmadia},
  title     = {Scalable Force Directed Graph Layout Algorithms Using Fast Multipole Methods},
  booktitle = {},
  year      = {2012},
}

@inproceedings{CTT100718866,
  author    = {Rio Yokota},
  title     = {Petascale Fast Multipole Methods on GPUs},
  booktitle = {},
  year      = {2012},
}

@inproceedings{CTT100718876,
  author    = {Rio Yokota and Tetsu Narumi and Lorena Barba and Kenji Yasuoka},
  title     = {Scaling Fast Multipole Methods up to 4000 GPUs},
  booktitle = {},
  year      = {2012},
}

@inproceedings{CTT100718874,
  author    = {Rio Yokota and Lorena Barba},
  title     = {Recent Trends in Hierarchical N-body Methods on GPUs},
  booktitle = {},
  year      = {2012},
}

@inproceedings{CTT100718878, author = {Hoang Vu Nguyen and Rio Yokota and Georgiy Stenchikov},
title = {A Parallel Numerical Simulation of Dust Particles Using Direct Numerical Simulation}, booktitle = {}, year = 2012, }

@inproceedings{CTT100718877,
  author    = {Rio Yokota},
  title     = {Running Fast Multipole Method on the Full Node of TSUBAME and K computer},
  booktitle = {},
  year      = {2012},
}

@inproceedings{CTT100718882,
  author    = {Rio Yokota},
  title     = {Fast N-body Methods on Many-core and Heterogenous Systems},
  booktitle = {},
  year      = {2012},
}

@inproceedings{CTT100718885,
  author    = {Rio Yokota},
  title     = {Petaflops Scale Turbulence Simulation on TSUBAME 2.0},
  booktitle = {},
  year      = {2011},
}

@inproceedings{CTT100718887,
  author    = {Tetsu Narumi and Rio Yokota and Lorena Barba and Kenji Yasuoka},
  title     = {Petascale Turbulence Simulation Using FMM},
  booktitle = {},
  year      = {2011},
}

@inproceedings{CTT100718889,
  author    = {Rio Yokota and Lorena Barba},
  title     = {Parameter Tuning of a Hybrid Treecode-FMM on GPUs},
  booktitle = {},
  year      = {2011},
}

@inproceedings{CTT100718888, author = {Rio Yokota and Lorena Barba}, title = {Fast Multipole Method vs.
Spectral Methods for the Simulation of Isotropic Turbulence on GPUs}, booktitle = {}, year = 2011, } @inproceedings{CTT100718890, author = {Rio Yokota and Lorena Barba}, title = {Large Scale Multi-GPU FMM for Bioelectrostatics}, booktitle = {}, year = 2011, } @inproceedings{CTT100718891, author = {Rio Yokota}, title = {12 Steps to a Fast Multipole Method on GPUs}, booktitle = {}, year = 2011, } @inproceedings{CTT100718894, author = {Rio Yokota and Jaydeep Bardhan and Matthew Knepley and Lorena Barba}, title = {(Really) Fast Macromolecular Electrostatics -- Fast Algorithms, Open Software and Accelerated Computing}, booktitle = {}, year = 2010, } @inproceedings{CTT100718895, author = {Rio Yokota and Lorena Barba}, title = {RBF Interpolation using Gaussians with Domain Decomposition on GPUs}, booktitle = {}, year = 2010, } @inproceedings{CTT100718896, author = {Rio Yokota and Lorena Barba}, title = {Performance of the Fast Multipole Method on GPUs Using Various Kernels}, booktitle = {}, year = 2010, } @inproceedings{CTT100718897, author = {Rio Yokota and Lorena Barba}, title = {Comparing the Treecode with FMM on GPUs for Vortex Particle Simulations of a Leapfrogging Vortex Ring}, booktitle = {}, year = 2010, } @inproceedings{CTT100718898, author = {Rio Yokota and Shinnosuke Obi}, title = {Lagrangian Simulation of Turbulence Using Vortex Methods}, booktitle = {}, year = 2010, } @inproceedings{CTT100718899, author = {Rio Yokota}, title = {Range of Applications for the Fast Multipole Method on GPUs}, booktitle = {}, year = 2010, } @inproceedings{CTT100718900, author = {Tsuyoshi Hamada and Rio Yokota and Keigo Nitadori and Tetsu Narumi and Kenji Yasuoka and Makoto Taiji and Kyoshi Oguri}, title = {42 TFlops Hierarchical N-Body Simulation on GPUs with Applications in Both Astrophysics and Turbulence}, booktitle = {}, year = 2009, } @inproceedings{CTT100718905, author = {Rio Yokota and Shinnosuke Obi}, title = {Validation of Vortex Methods in a Turblent Channel Flow}, 
booktitle = {}, year = 2009, } @inproceedings{CTT100718904, author = {Rio Yokota and Koji Fukagata and Shinnosuke Obi}, title = {Lagrangian Vortex Methods in Turbulent Channel Flows}, booktitle = {}, year = 2009, } @inproceedings{CTT100718906, author = {Rio Yokota and Tetsu Narumi and Ryuji Sakamaki and Kenji Yasuoka and Shinnosuke Obi}, title = {Fast Multipole Methods on GPUs for the Meshfree Simulation of Turbulence}, booktitle = {}, year = 2009, } @inproceedings{CTT100718907, author = {Rio Yokota and Tetsu Narumi and Ryuji Sakamaki and Shun Kameoka and Kenji Yasuoka and Shinnosuke Obi}, title = {DNS of Homogeneous Turbulence Using Vortex Methods Accelerated by the FMM on a Cluster of GPUs}, booktitle = {}, year = 2009, } @inproceedings{CTT100718908, author = {Rio Yokota and Tetsu Narumi and Ryuji Sakamaki and Shun Kameoka and Kenji Yasuoka and Shinnosuke Obi}, title = {Meshfree Simulation of Turbulence Using the Fast Multipole Methods on GPUs}, booktitle = {}, year = 2008, } @inproceedings{CTT100718909, author = {Rio Yokota and Shinnosuke Obi}, title = {Vortex Method Simulation of Turbulent Channel Flow}, booktitle = {}, year = 2008, } @inproceedings{CTT100718910, author = {Rio Yokota and Shinnosuke Obi}, title = {Direct Numerical Simulation of Homogeneous Shear Flow Using Vortex Methods}, booktitle = {}, year = 2008, } @inproceedings{CTT100718912, author = {Rio Yokota and Shinnosuke Obi}, title = {Mesh-Free Simulation of the Homogeneous Shear Flow Using Vortex Methods}, booktitle = {}, year = 2008, } @inproceedings{CTT100718913, author = {Akira Sato and Rio Yokota and Shinnosuke Obi}, title = {Computation of Wing-Tip Vortex by a Three-Dimensional Vortex Method}, booktitle = {}, year = 2007, } @inproceedings{CTT100718915, author = {Rio Yokota and Tetsu Narumi and Kenji Yasuoka and Toshikazu Ebisuzaki and Shinnosuke Obi}, title = {Mesh-Free Direct Numerical Simulation of Turbulence Using the Vortex Method on Parallel MDGRAPE-3 Boards Along with the Fast Multipole 
Method}, booktitle = {}, year = 2007, } @inproceedings{CTT100718916, author = {Rio Yokota and Shinnosuke Obi}, title = {Pure Lagrangian Vortex Methods for the Simulation of Decaying Isotropic Turbulence}, booktitle = {}, year = 2007, } @inproceedings{CTT100718917, author = {Rio Yokota and Shinnosuke Obi}, title = {Vortex Methods for the Calculation of Homogeneous Shear Flows}, booktitle = {}, year = 2007, } @inproceedings{CTT100718918, author = {Rio Yokota and Shinnosuke Obi}, title = {Mesh-Free Turbulence Simulation Using Vortex Methods}, booktitle = {}, year = 2007, } @inproceedings{CTT100718919, author = {Rio Yokota and Shinnosuke Obi}, title = {Simulation of Homogeneous Isotropic Turbulence Using the Vortex Method}, booktitle = {}, year = 2006, } @inproceedings{CTT100718920, author = {Rio Yokota and Shinnosuke Obi}, title = {Calculation of Fluid Structure Interaction Using VEM and BEM}, booktitle = {}, year = 2006, } @inproceedings{CTT100718921, author = {Rio Yokota and Shinnosuke Obi}, title = {Simulation of a Wake Using a 3-D Vortex Element Method}, booktitle = {}, year = 2006, } @inproceedings{CTT100718922, author = {Rio Yokota and Shinnosuke Obi}, title = {Vortex Flow Simulation Between Multipole Bridge Decks}, booktitle = {}, year = 2006, } @inproceedings{CTT100718924, author = {Rio Yokota and Shinnosuke Obi}, title = {Vortex Flow Simulation of Multipole Bluff Bodies}, booktitle = {}, year = 2005, } @inproceedings{CTT100718923, author = {Rio Yokota and Shinnosuke Obi}, title = {Vortex Flow Simulation of Multipole Bluff Bodies}, booktitle = {}, year = 2005, }