method: danet2022-07-11

Authors: Peking University

Description: TextVQA spatial reasoning method using depth information

@misc{li2022toward,
  author        = {Li, Hao and Huang, Jinfa and Jin, Peng and Song, Guoli and Wu, Qi and Chen, Jie},
  title         = {Toward {3D} Spatial Reasoning for Human-like Text-based Visual Question Answering},
  year          = {2022},
  eprint        = {2209.10326},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2209.10326},
}