@comment{CTT100885102: conference paper in the WACV 2023 proceedings.
  The publication year is stored only in the `year` field (not repeated in
  `booktitle`) so that bibliography styles do not print it twice.}
@inproceedings{CTT100885102,
  author    = {Shen, Ruoyue and Inoue, Nakamasa and Shinoda, Koichi},
  title     = {Text-Guided Object Detector for Multi-modal Video Question Answering},
  booktitle = {Proceedings of the {IEEE/CVF} Winter Conference on Applications of Computer Vision ({WACV})},
  year      = {2023},
}