% Conference paper (Asian Conference on Computer Vision, 2020).
@inproceedings{lin2020audiovisual,
  author    = {Lin, Yan-Bo and Wang, Yu-Chiang Frank},
  title     = {Audiovisual Transformer with Instance Attention for Audio-Visual Event Localization},
  booktitle = {Proceedings of the Asian Conference on Computer Vision},
  year      = {2020},
}