% Publication records (one entry per work, keyed by CTT record identifier).
% Text outside of entries is ignored by BibTeX, so these lines act as comments.
% Acronyms and proper nouns in titles are wrapped in braces so that
% sentence-casing bibliography styles do not lowercase them.

@article{CTT100832594,
  author  = {Osawa, Kazuki and Tsuji, Yohei and Ueno, Yuichiro and Naruse, Akira and Foo, Chuan-Sheng and Yokota, Rio},
  title   = {Scalable and Practical Natural Gradient for Large-Scale Deep Learning},
  journal = {{IEEE} Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2020},
}

% TODO: booktitle is empty in the source record; fill in the proceedings title
% (a required field for inproceedings entries) once it has been confirmed.
@inproceedings{CTT100854272,
  author    = {Ueno, Yuichiro and Osawa, Kazuki and Tsuji, Yohei and Naruse, Akira and Yokota, Rio},
  title     = {Rich Information is Affordable: A Systematic Performance Analysis of Second-order Optimization Using {K-FAC}},
  booktitle = {},
  year      = {2021},
}

@inproceedings{CTT100815305,
  author    = {Tsuji, Yohei and Osawa, Kazuki and Ueno, Yuichiro and Naruse, Akira and Yokota, Rio and Matsuoka, Satoshi},
  title     = {Performance Optimizations and Analysis of Distributed Deep Learning with Approximated Second-Order Optimization Method},
  booktitle = {Proceedings of the 48th International Conference on Parallel Processing: Workshops},
  year      = {2019},
}

% TODO: booktitle is empty in the source record; fill in the proceedings title
% (a required field for inproceedings entries) once it has been confirmed.
@inproceedings{CTT100793663,
  author    = {Osawa, Kazuki and Tsuji, Yohei and Ueno, Yuichiro and Naruse, Akira and Yokota, Rio and Matsuoka, Satoshi},
  title     = {Second-order Optimization Method for Large Mini-batch: Training {ResNet-50} on {ImageNet} in 35 Epochs},
  booktitle = {},
  year      = {2019},
}

% TODO: booktitle is empty in the source record; fill in the proceedings title
% (a required field for inproceedings entries) once it has been confirmed.
@inproceedings{CTT100793660,
  author    = {Ueno, Yuichiro and Yokota, Rio},
  title     = {Exhaustive Study of Hierarchical {AllReduce} Patterns for Large Messages Between {GPUs}},
  booktitle = {},
  year      = {2019},
}

% TODO: booktitle is empty in the source record; fill in the proceedings title
% (a required field for inproceedings entries) once it has been confirmed.
% The author names below are kept exactly as recorded: each is a single token
% with no comma, so BibTeX treats it as a surname-only name and the written
% order of the name is preserved in the output.
@inproceedings{CTT100793658,
  author    = {横田理央 and 大沢和樹 and 辻陽平 and 上野裕一郎 and 成瀬彰},
  title     = {大規模並列深層学習における2次の最適化手法の効果},
  booktitle = {},
  year      = {2019},
}