% Journal article in IEEE Transactions on Pattern Analysis and Machine Intelligence (2024).
% NOTE(review): volume, number, pages and doi are not recorded in this entry --
% add them once confirmed against the publisher's record.
@article{visualhow_tpami,
  author    = {Chen, Xianyu and Yang, Jinhui and Chen, Shi and Wang, Louis and Jiang, Ming and Zhao, Qi},
  title     = {Every Problem, Every Step, All In Focus: Learning to Solve Vision-Language Problems with Integrated Attention},
  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year      = {2024},
  publisher = {IEEE},
}